{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "ade0633c",
   "metadata": {},
   "source": [
    "Q-Learning 使用表格来估计 Q 函数，当状态空间很大或连续时表格难以扩展。\n",
    "\n",
    "因此这里改用神经网络来近似 Q 函数。"
   ]
  },
  {
   "cell_type": "code",
   "id": "91162df8",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-12-30T06:23:18.838396Z",
     "start_time": "2024-12-30T06:23:18.768458Z"
    }
   },
   "source": [
    "import gym\n",
    "\n",
    "\n",
    "# Environment definition\n",
    "class MyWrapper(gym.Wrapper):\n",
    "    \"\"\"CartPole-v1 wrapper with a simplified reset/step interface.\n",
    "\n",
    "    ``reset`` returns only the observation and ``step`` returns\n",
    "    ``(state, reward, over)``. An episode is forced to end after\n",
    "    ``max_steps`` steps, and an episode that ends earlier has the reward of\n",
    "    its final step replaced by ``fail_reward``.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, max_steps=200, fail_reward=-1000):\n",
    "        \"\"\"Create the wrapped CartPole-v1 environment.\n",
    "\n",
    "        Args:\n",
    "            max_steps: Number of steps after which the episode is ended.\n",
    "            fail_reward: Reward returned on the final step of an episode that\n",
    "                ends before ``max_steps`` is reached.\n",
    "        \"\"\"\n",
    "        env = gym.make('CartPole-v1', render_mode='rgb_array')\n",
    "        super().__init__(env)\n",
    "        self.env = env\n",
    "        self.max_steps = max_steps\n",
    "        self.fail_reward = fail_reward\n",
    "        self.step_n = 0\n",
    "\n",
    "    def reset(self, seed=None, options=None):\n",
    "        \"\"\"Start a new episode and return the initial observation.\n",
    "\n",
    "        Args:\n",
    "            seed: Optional seed forwarded to the wrapped environment so that\n",
    "                an episode can be reproduced.\n",
    "            options: Optional reset options forwarded to the wrapped\n",
    "                environment.\n",
    "\n",
    "        Returns:\n",
    "            The initial observation only; the info dict is discarded.\n",
    "        \"\"\"\n",
    "        state, _ = self.env.reset(seed=seed, options=options)\n",
    "        self.step_n = 0\n",
    "        return state\n",
    "\n",
    "    def step(self, action):\n",
    "        \"\"\"Apply ``action`` and return ``(state, reward, over)``.\n",
    "\n",
    "        ``over`` is true when the wrapped environment terminated or truncated\n",
    "        the episode, or when ``max_steps`` steps have been taken.\n",
    "        \"\"\"\n",
    "        state, reward, terminated, truncated, _ = self.env.step(action)\n",
    "        self.step_n += 1\n",
    "\n",
    "        reached_limit = self.step_n >= self.max_steps\n",
    "        over = terminated or truncated or reached_limit\n",
    "\n",
    "        # Ending before the step cap counts as a failure and is penalised.\n",
    "        if over and not reached_limit:\n",
    "            reward = self.fail_reward\n",
    "\n",
    "        return state, reward, over\n",
    "\n",
    "    def show(self):\n",
    "        \"\"\"Draw the current rendered frame with matplotlib.\"\"\"\n",
    "        from matplotlib import pyplot as plt\n",
    "        plt.figure(figsize=(3, 3))\n",
    "        plt.imshow(self.env.render())\n",
    "        plt.show()\n",
    "\n",
    "\n",
    "env = MyWrapper()\n",
    "\n",
    "env.reset()\n",
    "\n",
    "env.show()"
   ],
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<Figure size 300x300 with 1 Axes>"
      ],
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAASAAAADMCAYAAADTcn7NAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuNSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/xnp5ZAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAUNklEQVR4nO3dbUxb590G8MsGbMLLMYUUuzxgEWl9lqC8dCMJnFbP06l1wzpUNS0ftinqWBQlamaiplTRitSma7uJKvvQrVtKvrRJv2SZqMSmovSFkZZoigkNHRMhDWuldKAktpvyYAMJtvH5Px86TuuGpEDAN8bXTzpSzn3ftv/nDr7wOcfnYBERARGRAlbVBRBR+mIAEZEyDCAiUoYBRETKMICISBkGEBEpwwAiImUYQESkDAOIiJRhABGRMsoC6ODBgygvL0d2djaqqqrQ09OjqhQiUkRJAP35z39GY2MjnnvuOXz00UfYsGEDampqEAwGVZRDRIpYVFyMWlVVhU2bNuGPf/wjAMAwDJSVlWHPnj14+umnk10OESmSmewXjEaj6O3tRVNTk9lmtVrh8Xjg8/lmfEwkEkEkEjHXDcPAyMgIioqKYLFYFr1mIpobEcHY2BhKSkpgtd54RyvpAXTlyhXE43E4nc6EdqfTifPnz8/4mObmZjz//PPJKI+IFtDw8DBKS0tv2J/0AJqPpqYmNDY2muuhUAhutxvDw8PQNE1hZUQ0k3A4jLKyMuTn5990XNIDaOXKlcjIyEAgEEhoDwQCcLlcMz7GbrfDbrdf165pGgOIaAn7tkMkST8LZrPZUFlZic7OTrPNMAx0dnZC1/Vkl0NECinZBWtsbER9fT02btyIzZs343e/+x0mJiawfft2FeUQkSJKAujHP/4xPv/8c+zfvx9+vx933XUX3nnnnesOTBPR8qbke0C3KhwOw+FwIBQK8RgQ0RI02/corwUjImUYQESkDAOIiJRhABGRMgwgIlKGAUREyjCAiEgZBhARKcMAIiJlGEBEpAwDiIiUYQARkTIMICJShgFERMowgIhIGQYQESnDACIiZRhARKQMA4iIlGEAEZEyDCAiUoYBRETKMICISBkGEBEpwwAiImUYQESkDAOIiJRhABGRMnMOoJMnT+Khhx5CSUkJLBYL/vKXvyT0iwj279+PO+64AytWrIDH48Enn3ySMGZkZATbtm2DpmkoKCjAjh07MD4+fksbQkSpZ84BNDExgQ0bNuDgwYMz9h84cACvvPIKDh06hNOnTyM3Nxc1NTWYnJw0x2zbtg0DAwPo6OhAe3s7Tp48iV27ds1/K4goNcktACBtbW3mumEY4nK55Le//a3ZNjo6Kna7Xf70pz+JiMi5c+cEgHz44YfmmLffflssFotcvHhxVq8bCoUEgIRCoVspn4gWyWzfowt6DOjChQvw+/3weDxmm8PhQFVVFXw+HwDA5/OhoKAAGzduNMd4PB5YrVacPn16xueNRCIIh8MJCxGlvgUNIL/fDwBwOp0J7U6n0+zz+/0oLi5O6M/MzERhYaE55puam5vhcDjMpaysbCHLJiJFUuIsWFNTE0KhkLkMDw+rLomIFsCCBpDL5QIABAKBhPZAIGD2uVwuBIPBhP6pqSmMjIyYY77JbrdD07SEhYhS34IG0KpVq+ByudDZ2Wm2hcNhnD59GrquAwB0Xcfo6Ch6e3vNMSdOnIBhGKiqqlrIcohoicuc6wPGx8fx6aefmusXLlxAX18fCgsL4Xa7sXfvXvz617/GnXfeiVWrVuHZZ59FSUkJtm7dCgBYs2YNfvjDH2Lnzp04dOgQYrEYGhoa8JOf/AQlJSULtmFElALmenrt/fffFwDXLfX19SLy5an4Z599VpxOp9jtdrn//vtlcHAw4Tm++OIL+elPfyp5eXmiaZps375dxsbGFvwUHxGpMdv3qEVERGH+zUs4HIbD4UAoFOLxIKIlaLbv0ZQ4C0ZEyxMD
iIiUYQARkTIMICJShgFERMowgIhIGQYQESnDACIiZRhARKQMA4iIlGEAEZEyDCAiUoYBRETKMICISBkGEBEpwwAiImUYQESkDAOIiJRhABGRMgwgIlJmzn+Wh2ghiQjG/Z8iOj5ittkdxcgrXqWwKkoWBhApJvD/8z2M/vufZsvta/6HAZQmuAtGSolhwIhPqS6DFGEAkVoikHhMdRWkCAOIlBIxYBj8BJSuGECklMRjiE9OJLRl2HIUVUPJxgAipeKxCKJXQwlt2be5FFVDycYAoiXGAmuGTXURlCRzCqDm5mZs2rQJ+fn5KC4uxtatWzE4OJgwZnJyEl6vF0VFRcjLy0NdXR0CgUDCmKGhIdTW1iInJwfFxcXYt28fpqZ4HIC+ZM1kAKWLOQVQV1cXvF4vuru70dHRgVgshi1btmBi4qt9+CeffBJvvfUWWltb0dXVhUuXLuHRRx81++PxOGpraxGNRnHq1Cm88cYbOHLkCPbv379wW0UpLSOLAZQ25BYEg0EBIF1dXSIiMjo6KllZWdLa2mqO+fjjjwWA+Hw+ERE5fvy4WK1W8fv95piWlhbRNE0ikcisXjcUCgkACYVCt1I+LQGT4Sty5rU90nNo53+WXRK+/InqsugWzfY9ekvHgEKhLw8eFhYWAgB6e3sRi8Xg8XjMMatXr4bb7YbP5wMA+Hw+rFu3Dk6n0xxTU1ODcDiMgYGBGV8nEokgHA4nLLQ8GPEYAPmqwQJYLBZl9VByzTuADMPA3r17cc8992Dt2rUAAL/fD5vNhoKCgoSxTqcTfr/fHPP18Jnun+6bSXNzMxwOh7mUlZXNt2xaYmQqBoh8+0BaluYdQF6vF2fPnsWxY8cWsp4ZNTU1IRQKmcvw8PCivyYlhxFnAKWzeV2M2tDQgPb2dpw8eRKlpaVmu8vlQjQaxejoaMKnoEAgAJfLZY7p6elJeL7ps2TTY77JbrfDbrfPp1Ra4oypGBg/6WtOn4BEBA0NDWhra8OJEyewalXiFcuVlZXIyspCZ2en2TY4OIihoSHoug4A0HUd/f39CAaD5piOjg5omoaKiopb2RZKQZGxzyFfuxQjw5aDDHuuwooomeb0Ccjr9eLo0aP461//ivz8fPOYjcPhwIoVK+BwOLBjxw40NjaisLAQmqZhz5490HUd1dXVAIAtW7agoqICjz32GA4cOAC/349nnnkGXq+Xn3LSUDxyNWEXLCMrGxm2FQoromSaUwC1tLQAAH7wgx8ktB8+fBg///nPAQAvv/wyrFYr6urqEIlEUFNTg1dffdUcm5GRgfb2duzevRu6riM3Nxf19fV44YUXbm1LaFmwWDNgtWaoLoOSxCKSekcAw+EwHA4HQqEQNE1TXQ7dAv8/38Nw95vmenbBHah45Gl+Ckpxs32P8lowWlIs1gxYrLxRZ7pgAJEyIgIRI6HNYrXCYuWPZbrg/zQpZUzxbojpjAFEShlTUdUlkEIMIFJIGEBpjgFESsVjkcQGXoiaVhhApIyI4NrIxYS2nML/YgilEQYQqSOScBkGgP98/4cBlC4YQLSk8H7Q6YUBREuKlbdjTSsMIFpS+AkovTCASB0xrrsZmcVq5S1Z0wgDiJQxjDgMI666DFKIAUTKSHwKYAClNQYQKSNGHMIASmsMIFLGiEW+cSmGBdYs3hUznTCASJnYtTCmIlfNdUtGJrK1YoUVUbIxgEixr86CWSwWWDKzFNZCycYAoiXEAmsGAyidMIBo6bBYYM3kFxHTCQOIlgyLxQJrBu8HnU4YQKSMEZ/hdqz8FnRaYQCRMrwbIjGASBkjxgBKd9zhpkUTjUZx9erVG/ZPjIUS1kUE4VAYmbGZd8NWrFjBP9+9zDCAaNG0tbXhqaeeumF//QMVeLiq3Fz/96Ugtv3vvRifnJpx/Isvvojt27cvdJmkEAOIFs3ExAQuXrx44wHx/8aFa+vxecyNoqyLCI2+h38PX8RkdOYAGh8fX6RKSZU5HQNqaWnB+vXr
oWkaNE2Drut4++23zf7JyUl4vV4UFRUhLy8PdXV1CAQCCc8xNDSE2tpa5OTkoLi4GPv27cPU1Mw/cLS8fXZtLf51dTNGYiX45GolBsPrYBjGtz+Qlo05BVBpaSleeukl9Pb24syZM7jvvvvw8MMPY2BgAADw5JNP4q233kJrayu6urpw6dIlPProo+bj4/E4amtrEY1GcerUKbzxxhs4cuQI9u/fv7BbRSlhIu6AmD+CVoxE8hE35KaPoeVlTrtgDz30UML6b37zG7S0tKC7uxulpaV47bXXcPToUdx3330AgMOHD2PNmjXo7u5GdXU13nvvPZw7dw5/+9vf4HQ6cdddd+HFF1/EL3/5S/zqV7+CzcZvwaYTl+0CsizXEJNsZFkiKLL+C4YwgNLJvI8BxeNxtLa2YmJiArquo7e3F7FYDB6PxxyzevVquN1u+Hw+VFdXw+fzYd26dXA6neaYmpoa7N69GwMDA/je9743pxrOnz+PvLy8+W4CLbLLly/ftL//7En4rwTwfzEXCrKCGL0y+M07tCbw+/04d+7cAldJi2G2x+vmHED9/f3QdR2Tk5PIy8tDW1sbKioq0NfXB5vNhoKCgoTxTqcTfr8fwJc/QF8Pn+n+6b4biUQiiES++gua4XAYABAKhXj8aAm72Sl4ADg1MAwMDM/6+SYnJzE6OnqLVVEyTExMzGrcnAPou9/9Lvr6+hAKhfDmm2+ivr4eXV1dcy5wLpqbm/H8889f115VVQVN0xb1tWn+zp8/v6DPV15ejrvvvntBn5MWx/SHhG8z529C22w2fOc730FlZSWam5uxYcMG/P73v4fL5UI0Gr3uN1QgEIDL5QIAuFyu686KTa9Pj5lJU1MTQqGQuQwPz/63JhEtXbd8KYZhGIhEIqisrERWVhY6OzvNvsHBQQwNDUHXdQCAruvo7+9HMBg0x3R0dEDTNFRUVNzwNex2u3nqf3ohotQ3p12wpqYmPPjgg3C73RgbG8PRo0fxwQcf4N1334XD4cCOHTvQ2NiIwsJCaJqGPXv2QNd1VFdXAwC2bNmCiooKPPbYYzhw4AD8fj+eeeYZeL1efsWeKA3NKYCCwSB+9rOf4fLly3A4HFi/fj3effddPPDAAwCAl19+GVarFXV1dYhEIqipqcGrr75qPj4jIwPt7e3YvXs3dF1Hbm4u6uvr8cILLyzsVtGSYLPZFvTTKn9JLT8WkdT74kU4HIbD4UAoFOLu2BI2MTGBkZGRBXu+goIC5OfnL9jz0eKZ7XuU14LRosnNzUVubq7qMmgJ4/2AiEgZBhARKcMAIiJlGEBEpAwDiIiUYQARkTIMICJShgFERMowgIhIGQYQESnDACIiZRhARKQMA4iIlGEAEZEyDCAiUoYBRETKMICISBkGEBEpwwAiImUYQESkDAOIiJRhABGRMgwgIlKGAUREyjCAiEgZBhARKcMAIiJlGEBEpAwDiIiUYQARkTKZqguYDxEBAITDYcWVENFMpt+b0+/VG0nJAPriiy8AAGVlZYorIaKbGRsbg8PhuGF/SgZQYWEhAGBoaOimG0eJwuEwysrKMDw8DE3TVJeTEjhn8yMiGBsbQ0lJyU3HpWQAWa1fHrpyOBz8oZgHTdM4b3PEOZu72Xw44EFoIlKGAUREyqRkANntdjz33HOw2+2qS0kpnLe545wtLot823kyIqJFkpKfgIhoeWAAEZEyDCAiUoYBRETKpGQAHTx4EOXl5cjOzkZVVRV6enpUl6RMc3MzNm3ahPz8fBQXF2Pr1q0YHBxMGDM5OQmv14uioiLk5eWhrq4OgUAgYczQ0BBqa2uRk5OD4uJi7Nu3D1NTU8ncFGVeeuklWCwW7N2712zjnCWJpJhjx46JzWaT119/XQYGBmTnzp1SUFAggUBAdWlK1NTUyOHDh+Xs2bPS19cnP/rRj8Ttdsv4+Lg55vHHH5eysjLp7OyUM2fOSHV1tdx9991m/9TUlKxdu1Y8Ho/84x//kOPH
j8vKlSulqalJxSYlVU9Pj5SXl8v69evliSeeMNs5Z8mRcgG0efNm8Xq95no8HpeSkhJpbm5WWNXSEQwGBYB0dXWJiMjo6KhkZWVJa2urOebjjz8WAOLz+URE5Pjx42K1WsXv95tjWlpaRNM0iUQiyd2AJBobG5M777xTOjo65N577zUDiHOWPCm1CxaNRtHb2wuPx2O2Wa1WeDwe+Hw+hZUtHaFQCMBXF+z29vYiFoslzNnq1avhdrvNOfP5fFi3bh2cTqc5pqamBuFwGAMDA0msPrm8Xi9qa2sT5gbgnCVTSl2MeuXKFcTj8YT/dABwOp04f/68oqqWDsMwsHfvXtxzzz1Yu3YtAMDv98Nms6GgoCBhrNPphN/vN8fMNKfTfcvRsWPH8NFHH+HDDz+8ro9zljwpFUB0c16vF2fPnsXf//531aUsacPDw3jiiSfQ0dGB7Oxs1eWktZTaBVu5ciUyMjKuOxsRCATgcrkUVbU0NDQ0oL29He+//z5KS0vNdpfLhWg0itHR0YTxX58zl8s145xO9y03vb29CAaD+P73v4/MzExkZmaiq6sLr7zyCjIzM+F0OjlnSZJSAWSz2VBZWYnOzk6zzTAMdHZ2Qtd1hZWpIyJoaGhAW1sbTpw4gVWrViX0V1ZWIisrK2HOBgcHMTQ0ZM6Zruvo7+9HMBg0x3R0dEDTNFRUVCRnQ5Lo/vvvR39/P/r6+sxl48aN2LZtm/lvzlmSqD4KPlfHjh0Tu90uR44ckXPnzsmuXbukoKAg4WxEOtm9e7c4HA754IMP5PLly+Zy9epVc8zjjz8ubrdbTpw4IWfOnBFd10XXdbN/+pTyli1bpK+vT9555x25/fbb0+qU8tfPgolwzpIl5QJIROQPf/iDuN1usdlssnnzZunu7lZdkjIAZlwOHz5sjrl27Zr84he/kNtuu01ycnLkkUcekcuXLyc8z2effSYPPvigrFixQlauXClPPfWUxGKxJG+NOt8MIM5ZcvB2HESkTEodAyKi5YUBRETKMICISBkGEBEpwwAiImUYQESkDAOIiJRhABGRMgwgIlKGAUREyjCAiEgZBhARKfP/gN7ETv2j+D4AAAAASUVORK5CYII="
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "execution_count": 5
  },
  {
   "cell_type": "code",
   "id": "ecfbe912",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-12-30T06:23:18.851433Z",
     "start_time": "2024-12-30T06:23:18.845900Z"
    }
   },
   "source": [
    "import torch\n",
    "\n",
    "#定义模型,评估状态下每个动作的价值\n",
    "# 输入层（4个特征）：接收环境的状态。状态通常是环境中描述当前局面的变量，比如在 CartPole-v1 中，状态有4个变量（位置、速度、杆角度和角速度）。\n",
    "model = torch.nn.Sequential(\n",
    "    # 第一层：将输入的 4 个数字转化为 64 个特征。输入层：4 个特征。两层隐藏层：每层 64 个神经元。\n",
    "    torch.nn.Linear(4, 64),\n",
    "    # ReLU 激活函数：将 64 个特征中的负数值变成 0。\n",
    "    torch.nn.ReLU(),\n",
    "    # 第二层：对 64 个特征进一步处理，仍然输出 64 个特征。\n",
    "    torch.nn.Linear(64, 64),\n",
    "    # ReLU 激活函数：将 64 个特征中的负数值变成 0。\n",
    "    torch.nn.ReLU(),\n",
    "    # 将 64 个特征转化为最终的 2 个值，表示两个动作的价值。输出层（2个动作）：输出的是每个动作（比如向左或向右）的 Q值。\n",
    "    torch.nn.Linear(64, 2),\n",
    ")\n",
    "\n",
    "model"
   ],
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Sequential(\n",
       "  (0): Linear(in_features=4, out_features=64, bias=True)\n",
       "  (1): ReLU()\n",
       "  (2): Linear(in_features=64, out_features=64, bias=True)\n",
       "  (3): ReLU()\n",
       "  (4): Linear(in_features=64, out_features=2, bias=True)\n",
       ")"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 6
  },
  {
   "cell_type": "code",
   "id": "84cbf0ff",
   "metadata": {
    "scrolled": true,
    "ExecuteTime": {
     "end_time": "2024-12-30T06:23:19.020451Z",
     "start_time": "2024-12-30T06:23:18.941254Z"
    }
   },
   "source": [
    "from IPython import display\n",
    "import random\n",
    "\n",
    "\n",
    "def play(show=False, epsilon=0.1, verbose=False):\n",
    "    \"\"\"Play one episode with an epsilon-greedy policy and record it.\n",
    "\n",
    "    Args:\n",
    "        show: If True, redraw the rendered frame after every step.\n",
    "        epsilon: Probability of replacing the greedy action with a random\n",
    "            one sampled from the action space.\n",
    "        verbose: If True, print the state, the Q-values and the greedy\n",
    "            action at every step (debugging aid, off by default).\n",
    "\n",
    "    Returns:\n",
    "        A tuple ``(data, reward_sum)``: ``data`` is the list of\n",
    "        ``(state, action, reward, next_state, over)`` tuples collected\n",
    "        during the episode and ``reward_sum`` is the sum of their rewards.\n",
    "    \"\"\"\n",
    "    data = []\n",
    "    reward_sum = 0\n",
    "\n",
    "    state = env.reset()\n",
    "    over = False\n",
    "\n",
    "    while not over:\n",
    "        # Greedy action: feed the state as a batch of one (shape [1, 4]),\n",
    "        # get one Q-value per action (shape [1, 2]) and take the index of the\n",
    "        # largest one as a plain Python int. Acting needs no gradients, so\n",
    "        # the forward pass runs once under no_grad.\n",
    "        with torch.no_grad():\n",
    "            q_values = model(torch.FloatTensor(state).reshape(1, 4))\n",
    "        action = q_values.argmax().item()\n",
    "\n",
    "        if verbose:\n",
    "            print('state=', state)\n",
    "            print('q_values=', q_values)\n",
    "            print('greedy_action=', action)\n",
    "\n",
    "        # Exploration: with probability epsilon take a random action instead.\n",
    "        if random.random() < epsilon:\n",
    "            action = env.action_space.sample()\n",
    "\n",
    "        next_state, reward, over = env.step(action)\n",
    "\n",
    "        # Record the transition and accumulate the episode reward.\n",
    "        data.append((state, action, reward, next_state, over))\n",
    "        reward_sum += reward\n",
    "\n",
    "        state = next_state\n",
    "\n",
    "        if show:\n",
    "            display.clear_output(wait=True)\n",
    "            env.show()\n",
    "\n",
    "    return data, reward_sum\n",
    "\n",
    "\n",
    "# Play one episode and display its total reward\n",
    "play()[-1]\n"
   ],
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1= [ 0.0410597  -0.0009886  -0.04174996 -0.0328249 ]\n",
      "2= tensor([[-0.0906,  0.0214]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04103993  0.19470643 -0.04240646 -0.33838257]\n",
      "2= tensor([[-0.0983,  0.0431]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04493406  0.39040536 -0.04917411 -0.6441308 ]\n",
      "2= tensor([[-0.1033,  0.0496]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05274216  0.5861769  -0.06205673 -0.9518845 ]\n",
      "2= tensor([[-0.1096,  0.0599]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0644657   0.7820766  -0.08109441 -1.2634014 ]\n",
      "2= tensor([[-0.1177,  0.0651]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08010723  0.9781362  -0.10636245 -1.5803399 ]\n",
      "2= tensor([[-0.1349,  0.0685]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09966996  1.1743516  -0.13796924 -1.9042114 ]\n",
      "2= tensor([[-0.1594,  0.0694]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12315699  1.3706689  -0.17605346 -2.2363236 ]\n",
      "2= tensor([[-0.1883,  0.0680]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "D:\\app\\anaconda3\\install\\envs\\pytorch_env_3_8\\lib\\site-packages\\gym\\utils\\passive_env_checker.py:233: DeprecationWarning: `np.bool8` is a deprecated alias for `np.bool_`.  (Deprecated NumPy 1.24)\n",
      "  if not isinstance(terminated, (bool, np.bool8)):\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "-993.0"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 7
  },
  {
   "cell_type": "code",
   "id": "95ce610e",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-12-30T06:23:19.139394Z",
     "start_time": "2024-12-30T06:23:19.030662Z"
    }
   },
   "source": [
    "#数据池\n",
    "class Pool:\n",
    "    \"\"\"\n",
    "    用于存储和管理经验数据的类（经验回放池）。\n",
    "    经验池在DQN中是关键组件，通过保存和采样历史经验来打破样本之间的时间相关性。\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self):\n",
    "        \"\"\"\n",
    "        初始化经验池。\n",
    "        \"\"\"\n",
    "        self.pool = []  # 存储经验数据的列表，每条经验是一个五元组：(state, action, reward, next_state, over)\n",
    "\n",
    "    def __len__(self):\n",
    "        \"\"\"\n",
    "        获取经验池的当前大小。\n",
    "        \"\"\"\n",
    "        return len(self.pool)  # 返回经验池中存储的经验数量\n",
    "\n",
    "    def __getitem__(self, i):\n",
    "        \"\"\"\n",
    "        按索引获取经验池中的某条经验。\n",
    "        \"\"\"\n",
    "        return self.pool[i]  # 返回第 i 条经验\n",
    "\n",
    "    # 更新动作池\n",
    "    def update(self):\n",
    "        \"\"\"\n",
    "        更新经验池，添加新的经验数据。\n",
    "        \"\"\"\n",
    "        # 保存更新前的经验池大小\n",
    "        old_len = len(self.pool)\n",
    "\n",
    "        # 确保每次更新至少增加200条新数据\n",
    "        while len(self.pool) - old_len < 200:\n",
    "            # 通过调用 play() 收集新经验，并将状态-动作-奖励等信息添加到经验池中\n",
    "            self.pool.extend(play()[0])\n",
    "\n",
    "        # 只保留最近的 20000 条经验，丢弃更旧的经验\n",
    "        self.pool = self.pool[-2_0000:]\n",
    "\n",
    "    # 获取一批数据样本\n",
    "    def sample(self):\n",
    "        \"\"\"\n",
    "        从经验池中随机采样一批数据，用于模型训练。\n",
    "        \"\"\"\n",
    "        # 从经验池中随机采样 64 条经验\n",
    "        data = random.sample(self.pool, 64)\n",
    "\n",
    "        # 将采样的数据拆分为状态、动作、奖励、下一状态和结束标志\n",
    "        state = torch.FloatTensor([i[0] for i in data]).reshape(-1, 4)  # 提取状态并转换为形状为 [64, 4] 的张量\n",
    "        action = torch.LongTensor([i[1] for i in data]).reshape(-1, 1)  # 提取动作并转换为形状为 [64, 1] 的张量\n",
    "        reward = torch.FloatTensor([i[2] for i in data]).reshape(-1, 1)  # 提取奖励并转换为形状为 [64, 1] 的张量\n",
    "        next_state = torch.FloatTensor([i[3] for i in data]).reshape(-1, 4)  # 提取下一状态并转换为 [64, 4] 的张量\n",
    "        over = torch.LongTensor([i[4] for i in data]).reshape(-1, 1)  # 提取结束标志并转换为形状为 [64, 1] 的张量\n",
    "\n",
    "        # 返回采样的数据，分别为状态、动作、奖励、下一状态和结束标志\n",
    "        return state, action, reward, next_state, over\n",
    "\n",
    "\n",
    "# Build the replay pool and fill it with a first batch of experience\n",
    "pool = Pool()\n",
    "pool.update()\n",
    "\n",
    "# Smoke-test sampling; the sampled batch itself is discarded\n",
    "pool.sample()\n",
    "\n",
    "# Show the pool size and its first stored transition\n",
    "len(pool), pool[0]\n"
   ],
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1= [ 0.00487011  0.00548145 -0.04611025 -0.01432442]\n",
      "2= tensor([[-0.0914,  0.0231]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00497974  0.20123331 -0.04639674 -0.32119173]\n",
      "2= tensor([[-0.0998,  0.0455]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00900441  0.39698422 -0.05282057 -0.6281379 ]\n",
      "2= tensor([[-0.1047,  0.0517]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01694409  0.59280205 -0.06538333 -0.93697697]\n",
      "2= tensor([[-0.1106,  0.0615]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02880013  0.7887418  -0.08412287 -1.2494676 ]\n",
      "2= tensor([[-0.1175,  0.0671]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04457497  0.98483527 -0.10911222 -1.5672706 ]\n",
      "2= tensor([[-0.1348,  0.0707]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06427167  1.1810784  -0.14045763 -1.8919002 ]\n",
      "2= tensor([[-0.1594,  0.0713]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08789325  1.3774179  -0.17829564 -2.224668  ]\n",
      "2= tensor([[-0.1884,  0.0699]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04224421  0.04700354  0.00770026 -0.03975704]\n",
      "2= tensor([[-0.0958,  0.0288]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04130414  0.24201423  0.00690512 -0.33000055]\n",
      "2= tensor([[-0.0996,  0.0487]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-3.6463857e-02  4.3703720e-01  3.0511327e-04 -6.2049794e-01]\n",
      "2= tensor([[-0.1023,  0.0544]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02772311  0.241911   -0.01210485 -0.32771894]\n",
      "2= tensor([[-0.0998,  0.0486]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02288489  0.43720317 -0.01865922 -0.6241945 ]\n",
      "2= tensor([[-0.1032,  0.0542]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01414083  0.6325806  -0.03114311 -0.9226951 ]\n",
      "2= tensor([[-0.1081,  0.0652]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00148922  0.82810915 -0.04959701 -1.2250003 ]\n",
      "2= tensor([[-0.1155,  0.0721]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01507297  1.0238335  -0.07409702 -1.5328013 ]\n",
      "2= tensor([[-0.1300,  0.0774]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03554964  1.2197659  -0.10475305 -1.8476582 ]\n",
      "2= tensor([[-0.1529,  0.0782]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05994495  1.4158741  -0.14170621 -2.170949  ]\n",
      "2= tensor([[-0.1811,  0.0772]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08826244  1.6120654  -0.18512519 -2.5038087 ]\n",
      "2= tensor([[-0.2105,  0.0745]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01082981 -0.0055708  -0.01993496 -0.04202086]\n",
      "2= tensor([[-0.0917,  0.0225]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0107184   0.18983126 -0.02077538 -0.3409262 ]\n",
      "2= tensor([[-0.0987,  0.0439]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01451502  0.38524255 -0.0275939  -0.64008737]\n",
      "2= tensor([[-0.1034,  0.0498]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02221988  0.5807381  -0.04039565 -0.9413307 ]\n",
      "2= tensor([[-0.1082,  0.0602]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03383464  0.77638054 -0.05922227 -1.246428  ]\n",
      "2= tensor([[-0.1155,  0.0666]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04936225  0.97220993 -0.08415082 -1.5570582 ]\n",
      "2= tensor([[-0.1319,  0.0709]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06880645  1.1682329  -0.11529199 -1.8747634 ]\n",
      "2= tensor([[-0.1551,  0.0721]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0921711   1.3644092  -0.15278725 -2.2008953 ]\n",
      "2= tensor([[-0.1835,  0.0711]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.11945929  1.5606366  -0.19680516 -2.5365524 ]\n",
      "2= tensor([[-0.2132,  0.0682]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04612847 -0.00165535 -0.013187   -0.00131287]\n",
      "2= tensor([[-0.0928,  0.0250]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04616158  0.19365321 -0.01321326 -0.2981271 ]\n",
      "2= tensor([[-0.1004,  0.0466]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04228852  0.388961   -0.0191758  -0.5949478 ]\n",
      "2= tensor([[-0.1031,  0.0539]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0345093   0.19411261 -0.03107476 -0.3083663 ]\n",
      "2= tensor([[-0.1006,  0.0466]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03062705  0.38966325 -0.03724208 -0.6106851 ]\n",
      "2= tensor([[-0.1044,  0.0534]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02283378  0.5852854  -0.04945579 -0.91486156]\n",
      "2= tensor([[-0.1094,  0.0625]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01112807  0.7810401  -0.06775302 -1.2226686 ]\n",
      "2= tensor([[-0.1158,  0.0691]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00449273  0.9769663  -0.09220639 -1.5357878 ]\n",
      "2= tensor([[-0.1321,  0.0734]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02403205  1.1730696  -0.12292214 -1.8557636 ]\n",
      "2= tensor([[-0.1554,  0.0742]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04749345  1.369309   -0.16003741 -2.1839495 ]\n",
      "2= tensor([[-0.1840,  0.0731]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07487962  1.5655808  -0.20371641 -2.5214458 ]\n",
      "2= tensor([[-0.2143,  0.0696]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00420663  0.01504847 -0.01353978  0.01713522]\n",
      "2= tensor([[-0.0921,  0.0227]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0045076  -0.17987671 -0.01319707  0.30551562]\n",
      "2= tensor([[-0.0763, -0.0054]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00091007  0.01543079 -0.00708676  0.00870005]\n",
      "2= tensor([[-0.0924,  0.0230]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00121868  0.21065365 -0.00691276 -0.2862104 ]\n",
      "2= tensor([[-0.0987,  0.0451]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00543175  0.4058735  -0.01263697 -0.5810655 ]\n",
      "2= tensor([[-0.1013,  0.0518]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01354922  0.60117024 -0.02425828 -0.87770236]\n",
      "2= tensor([[-0.1063,  0.0632]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02557263  0.7966133  -0.04181232 -1.177912  ]\n",
      "2= tensor([[-0.1140,  0.0701]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04150489  0.9922526  -0.06537057 -1.4834037 ]\n",
      "2= tensor([[-0.1264,  0.0757]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06134995  0.7979859  -0.09503864 -1.2118313 ]\n",
      "2= tensor([[-0.1185,  0.0672]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07730967  0.9941974  -0.11927526 -1.5327197 ]\n",
      "2= tensor([[-0.1336,  0.0707]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09719361  1.1905377  -0.14992966 -1.8601214 ]\n",
      "2= tensor([[-0.1579,  0.0716]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12100437  1.3869529  -0.18713209 -2.1953533 ]\n",
      "2= tensor([[-0.1869,  0.0702]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0214668   0.02098413  0.03826952  0.01477628]\n",
      "2= tensor([[-0.0936,  0.0246]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02104712  0.21553695  0.03856505 -0.2655908 ]\n",
      "2= tensor([[-0.0980,  0.0452]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01673638  0.41008785  0.03325323 -0.5458648 ]\n",
      "2= tensor([[-0.0980,  0.0526]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00853462  0.6047272   0.02233593 -0.8278878 ]\n",
      "2= tensor([[-0.1031,  0.0645]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00355992  0.79953676  0.00577818 -1.113463  ]\n",
      "2= tensor([[-0.1084,  0.0734]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01955066  0.99458236 -0.01649108 -1.4043278 ]\n",
      "2= tensor([[-0.1191,  0.0802]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0394423   1.1899052  -0.04457764 -1.7021203 ]\n",
      "2= tensor([[-0.1374,  0.0840]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0632404   1.3855112  -0.07862004 -2.0083394 ]\n",
      "2= tensor([[-0.1619,  0.0840]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09095063  1.5813586  -0.11878683 -2.3242934 ]\n",
      "2= tensor([[-0.1899,  0.0825]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1225778  1.7773421 -0.1652727 -2.6510384]\n",
      "2= tensor([[-0.2175,  0.0807]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04586304  0.03249586 -0.0179144   0.02087452]\n",
      "2= tensor([[-0.0904,  0.0223]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04651296  0.22787008 -0.01749691 -0.27740633]\n",
      "2= tensor([[-0.0976,  0.0442]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05107036  0.42323723 -0.02304504 -0.57555604]\n",
      "2= tensor([[-0.0993,  0.0517]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05953511  0.22844577 -0.03455615 -0.29022107]\n",
      "2= tensor([[-0.0976,  0.0440]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06410402  0.424043   -0.04036058 -0.59359926]\n",
      "2= tensor([[-0.1001,  0.0516]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07258488  0.619706   -0.05223256 -0.89871746]\n",
      "2= tensor([[-0.1076,  0.0634]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08497901  0.81549543 -0.07020691 -1.2073506 ]\n",
      "2= tensor([[-0.1174,  0.0681]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10128891  1.0114506  -0.09435392 -1.5211831 ]\n",
      "2= tensor([[-0.1305,  0.0724]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12151793  1.2075777  -0.12477759 -1.841764  ]\n",
      "2= tensor([[-0.1533,  0.0739]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.14566948  1.4038364  -0.16161287 -2.1704528 ]\n",
      "2= tensor([[-0.1819,  0.0727]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1737462   1.6001245  -0.20502192 -2.5083559 ]\n",
      "2= tensor([[-0.2105,  0.0708]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00165683  0.03186763 -0.00011815 -0.00777434]\n",
      "2= tensor([[-0.0932,  0.0250]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-1.0194770e-03  2.2699128e-01 -2.7363602e-04 -3.0049455e-01]\n",
      "2= tensor([[-0.0985,  0.0460]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00352035  0.4221171  -0.00628353 -0.59326375]\n",
      "2= tensor([[-0.1010,  0.0524]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01196269  0.6173265  -0.0181488  -0.8879193 ]\n",
      "2= tensor([[-0.1060,  0.0641]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02430922  0.81268996 -0.03590719 -1.1862518 ]\n",
      "2= tensor([[-0.1139,  0.0711]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04056302  1.0082587  -0.05963222 -1.4899702 ]\n",
      "2= tensor([[-0.1262,  0.0770]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0607282   1.2040539  -0.08943163 -1.8006625 ]\n",
      "2= tensor([[-0.1477,  0.0787]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08480927  1.4000547  -0.12544487 -2.1197467 ]\n",
      "2= tensor([[-0.1750,  0.0781]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.11281037  1.5961838  -0.16783981 -2.4484127 ]\n",
      "2= tensor([[-0.2040,  0.0757]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04099942 -0.03761211 -0.03004561  0.00503206]\n",
      "2= tensor([[-0.0904,  0.0224]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04175166  0.15792756 -0.02994497 -0.29697716]\n",
      "2= tensor([[-0.1008,  0.0448]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03859311  0.35346332 -0.03588451 -0.5989518 ]\n",
      "2= tensor([[-0.1042,  0.0526]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03152385  0.54906845 -0.04786355 -0.9027184 ]\n",
      "2= tensor([[-0.1091,  0.0605]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02054248  0.744805   -0.06591792 -1.2100534 ]\n",
      "2= tensor([[-0.1151,  0.0676]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00564638  0.9407133  -0.09011899 -1.5226436 ]\n",
      "2= tensor([[-0.1315,  0.0719]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01316789  1.1368009  -0.12057186 -1.8420405 ]\n",
      "2= tensor([[-0.1541,  0.0727]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0359039   1.3330294  -0.15741266 -2.1696086 ]\n",
      "2= tensor([[-0.1826,  0.0717]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06256449  1.5292989  -0.20080484 -2.5064614 ]\n",
      "2= tensor([[-0.2131,  0.0680]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01052872  0.0317057  -0.03895787  0.00922835]\n",
      "2= tensor([[-0.0929,  0.0250]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00989461  0.22736408 -0.0387733  -0.29548725]\n",
      "2= tensor([[-0.1001,  0.0475]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00534733  0.42301673 -0.04468305 -0.6001421 ]\n",
      "2= tensor([[-0.1037,  0.0540]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00311301  0.61873436 -0.05668589 -0.90655804]\n",
      "2= tensor([[-0.1098,  0.0644]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01548769  0.81457615 -0.07481705 -1.2165055 ]\n",
      "2= tensor([[-0.1170,  0.0703]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03177922  1.010579   -0.09914716 -1.5316631 ]\n",
      "2= tensor([[-0.1321,  0.0747]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0519908   1.2067463  -0.12978043 -1.8535706 ]\n",
      "2= tensor([[-0.1559,  0.0754]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07612573  1.4030344  -0.16685183 -2.183575  ]\n",
      "2= tensor([[-0.1846,  0.0741]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00072435  0.01503699 -0.03496476  0.02324755]\n",
      "2= tensor([[-0.0916,  0.0229]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00102509  0.21064247 -0.03449981 -0.2802589 ]\n",
      "2= tensor([[-0.0996,  0.0458]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00523794  0.40623912 -0.04010499 -0.58362025]\n",
      "2= tensor([[-0.1030,  0.0528]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01336273  0.6018993  -0.05177739 -0.88866216]\n",
      "2= tensor([[-0.1088,  0.0634]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02540071  0.79768425 -0.06955064 -1.1971618 ]\n",
      "2= tensor([[-0.1163,  0.0693]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0413544   0.99363405 -0.09349387 -1.5108073 ]\n",
      "2= tensor([[-0.1304,  0.0739]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06122708  1.189756   -0.12371002 -1.8311527 ]\n",
      "2= tensor([[-0.1533,  0.0751]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0850222   1.3860118  -0.16033307 -2.1595645 ]\n",
      "2= tensor([[-0.1818,  0.0739]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.11274243  1.5823015  -0.20352437 -2.497159  ]\n",
      "2= tensor([[-0.2112,  0.0713]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02598374  0.01676381  0.00089372 -0.03519315]\n",
      "2= tensor([[-0.0918,  0.0234]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 2.6319019e-02  2.1187294e-01  1.8985455e-04 -3.2759398e-01]\n",
      "2= tensor([[-0.0975,  0.0438]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03055648  0.40699217 -0.00636202 -0.620217  ]\n",
      "2= tensor([[-0.1007,  0.0500]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03869632  0.21195966 -0.01876637 -0.32954457]\n",
      "2= tensor([[-0.0977,  0.0436]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04293551  0.40734366 -0.02535726 -0.628086  ]\n",
      "2= tensor([[-0.1013,  0.0501]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05108239  0.60281014 -0.03791898 -0.9286457 ]\n",
      "2= tensor([[-0.1072,  0.0616]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06313859  0.79842293 -0.05649189 -1.2329994 ]\n",
      "2= tensor([[-0.1162,  0.0673]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07910705  0.99422395 -0.08115188 -1.5428321 ]\n",
      "2= tensor([[-0.1306,  0.0719]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09899153  1.1902221  -0.11200852 -1.8596944 ]\n",
      "2= tensor([[-0.1533,  0.0733]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12279597  1.3863806  -0.1492024  -2.1849499 ]\n",
      "2= tensor([[-0.1817,  0.0724]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.15052359  1.5826011  -0.1929014  -2.5197136 ]\n",
      "2= tensor([[-0.2105,  0.0702]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01607406  0.04072457 -0.04748269  0.02117624]\n",
      "2= tensor([[-0.0920,  0.0241]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01688855  0.23649417 -0.04705917 -0.28610188]\n",
      "2= tensor([[-0.0995,  0.0469]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02161843  0.04207385 -0.0527812  -0.00862452]\n",
      "2= tensor([[-0.0923,  0.0250]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02245991  0.23791146 -0.05295369 -0.31748232]\n",
      "2= tensor([[-0.0995,  0.0470]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02721814  0.4337461  -0.05930334 -0.6263836 ]\n",
      "2= tensor([[-0.1033,  0.0536]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03589306  0.6296435  -0.07183101 -0.93713814]\n",
      "2= tensor([[-0.1107,  0.0639]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04848593  0.8256567  -0.09057377 -1.2514999 ]\n",
      "2= tensor([[-0.1190,  0.0688]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06499907  1.021815   -0.11560377 -1.5711234 ]\n",
      "2= tensor([[-0.1354,  0.0723]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08543536  1.2181112  -0.14702624 -1.8975143 ]\n",
      "2= tensor([[-0.1606,  0.0727]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10979759  1.4144884  -0.18497653 -2.2319725 ]\n",
      "2= tensor([[-0.1896,  0.0710]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03051698  0.03804848 -0.02369151  0.02549445]\n",
      "2= tensor([[-0.0913,  0.0231]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03127795  0.23350203 -0.02318162 -0.27456826]\n",
      "2= tensor([[-0.0983,  0.0453]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03594799  0.42894694 -0.02867298 -0.5744716 ]\n",
      "2= tensor([[-0.1002,  0.0528]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04452692  0.6244589  -0.04016241 -0.87604773]\n",
      "2= tensor([[-0.1069,  0.0645]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0570161   0.82010305 -0.05768337 -1.1810819 ]\n",
      "2= tensor([[-0.1158,  0.0702]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07341816  0.62577534 -0.081305   -0.9070246 ]\n",
      "2= tensor([[-0.1101,  0.0637]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08593367  0.82189834 -0.0994455  -1.2241147 ]\n",
      "2= tensor([[-0.1197,  0.0678]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10237164  1.0181504  -0.12392779 -1.5462272 ]\n",
      "2= tensor([[-0.1345,  0.0709]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12273464  1.2145237  -0.15485233 -1.8748696 ]\n",
      "2= tensor([[-0.1593,  0.0717]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.14702512  1.4109602  -0.19234973 -2.2113435 ]\n",
      "2= tensor([[-0.1884,  0.0701]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04965112 -0.04625352  0.0491771  -0.03137599]\n",
      "2= tensor([[-0.0894,  0.0174]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04872605  0.14812997  0.04854958 -0.3081465 ]\n",
      "2= tensor([[-0.0952,  0.0378]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05168865  0.34252775  0.04238665 -0.5851316 ]\n",
      "2= tensor([[-0.0967,  0.0451]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05853921  0.5370311   0.03068402 -0.8641667 ]\n",
      "2= tensor([[-0.0999,  0.0579]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06927983  0.73172224  0.01340069 -1.1470462 ]\n",
      "2= tensor([[-0.1082,  0.0657]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08391427  0.9266667  -0.00954024 -1.4354969 ]\n",
      "2= tensor([[-0.1184,  0.0728]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10244761  0.73166364 -0.03825017 -1.1458105 ]\n",
      "2= tensor([[-0.1123,  0.0640]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.11708088  0.92726374 -0.06116639 -1.4502388 ]\n",
      "2= tensor([[-0.1238,  0.0690]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.13562615  1.1230818  -0.09017116 -1.7613882 ]\n",
      "2= tensor([[-0.1427,  0.0721]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.15808779  1.319101   -0.12539892 -2.080697  ]\n",
      "2= tensor([[-0.1704,  0.0715]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.18446982  1.5152498  -0.16701287 -2.4093807 ]\n",
      "2= tensor([[-0.1988,  0.0701]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02181497 -0.00760562  0.02448019  0.00883108]\n",
      "2= tensor([[-0.0908,  0.0205]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02166286  0.18715686  0.02465681 -0.27602863]\n",
      "2= tensor([[-0.0970,  0.0419]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.025406    0.3819185   0.01913624 -0.56083393]\n",
      "2= tensor([[-0.0983,  0.0491]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03304437  0.5767667   0.00791956 -0.84742707]\n",
      "2= tensor([[-0.1026,  0.0615]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0445797   0.7717798  -0.00902898 -1.1376091 ]\n",
      "2= tensor([[-0.1103,  0.0690]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0600153   0.9670186  -0.03178116 -1.43311   ]\n",
      "2= tensor([[-0.1205,  0.0760]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07935567  1.1625179  -0.06044336 -1.7355529 ]\n",
      "2= tensor([[-0.1399,  0.0789]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10260603  1.3582748  -0.09515442 -2.0464115 ]\n",
      "2= tensor([[-0.1657,  0.0787]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12977153  1.5542356  -0.13608265 -2.3669562 ]\n",
      "2= tensor([[-0.1941,  0.0770]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.16085623  1.7502797  -0.18342178 -2.6981885 ]\n",
      "2= tensor([[-0.2216,  0.0755]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02026726  0.00153479 -0.00654734  0.04084767]\n",
      "2= tensor([[-0.0907,  0.0202]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02029796  0.19675002 -0.00573038 -0.2538938 ]\n",
      "2= tensor([[-0.0981,  0.0432]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02423296  0.39195332 -0.01080826 -0.54837865]\n",
      "2= tensor([[-0.0998,  0.0509]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03207203  0.58722544 -0.02177583 -0.84444726]\n",
      "2= tensor([[-0.1048,  0.0624]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04381654  0.78263766 -0.03866478 -1.1438977 ]\n",
      "2= tensor([[-0.1130,  0.0692]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05946929  0.9782428  -0.06154273 -1.4484508 ]\n",
      "2= tensor([[-0.1241,  0.0752]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07903414  1.1740651  -0.09051175 -1.7597102 ]\n",
      "2= tensor([[-0.1445,  0.0775]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10251544  1.3700877  -0.12570596 -2.079115  ]\n",
      "2= tensor([[-0.1717,  0.0769]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1299172   1.5662392  -0.16728824 -2.4078808 ]\n",
      "2= tensor([[-0.2005,  0.0748]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00925919  0.03804979 -0.01251205  0.04271087]\n",
      "2= tensor([[-0.0922,  0.0235]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01002019  0.2333489  -0.01165783 -0.25389332]\n",
      "2= tensor([[-0.0986,  0.0460]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01468717  0.42863536 -0.0167357  -0.5502304 ]\n",
      "2= tensor([[-0.1000,  0.0535]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02325987  0.62398833 -0.02774031 -0.8481389 ]\n",
      "2= tensor([[-0.1057,  0.0652]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03573964  0.81947744 -0.04470309 -1.1494144 ]\n",
      "2= tensor([[-0.1142,  0.0718]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05212919  1.0151534  -0.06769138 -1.4557735 ]\n",
      "2= tensor([[-0.1251,  0.0778]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07243226  1.2110379  -0.09680685 -1.7688131 ]\n",
      "2= tensor([[-0.1461,  0.0797]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09665301  1.4071105  -0.1321831  -2.0899618 ]\n",
      "2= tensor([[-0.1736,  0.0790]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12479522  1.6032951  -0.17398234 -2.4204204 ]\n",
      "2= tensor([[-0.2024,  0.0767]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03682542 -0.01214759 -0.0444237  -0.00143571]\n",
      "2= tensor([[-0.0895,  0.0199]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03658247  0.18358238 -0.04445241 -0.30779728]\n",
      "2= tensor([[-0.0986,  0.0427]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04025412  0.3793086  -0.05060836 -0.6141613 ]\n",
      "2= tensor([[-0.1032,  0.0497]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04784029  0.5750998  -0.06289159 -0.9223447 ]\n",
      "2= tensor([[-0.1093,  0.0600]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05934228  0.7710126  -0.08133848 -1.2341107 ]\n",
      "2= tensor([[-0.1171,  0.0651]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07476254  0.9670805  -0.1060207  -1.5511274 ]\n",
      "2= tensor([[-0.1334,  0.0688]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09410415  1.1633024  -0.13704324 -1.8749193 ]\n",
      "2= tensor([[-0.1572,  0.0699]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1173702   1.3596286  -0.17454162 -2.2068121 ]\n",
      "2= tensor([[-0.1861,  0.0687]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02093772 -0.01938792  0.03394543  0.02261141]\n",
      "2= tensor([[-0.0903,  0.0192]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02054996  0.17523119  0.03439765 -0.25917104]\n",
      "2= tensor([[-0.0967,  0.0410]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02405458  0.36984563  0.02921423 -0.5408091 ]\n",
      "2= tensor([[-0.0972,  0.0488]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0314515   0.56454504  0.01839805 -0.8241458 ]\n",
      "2= tensor([[-0.1015,  0.0608]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0427424   0.75941056  0.00191513 -1.1109859 ]\n",
      "2= tensor([[-0.1085,  0.0690]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05793061  0.9545073  -0.02030458 -1.4030675 ]\n",
      "2= tensor([[-0.1189,  0.0761]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07702076  1.1498755  -0.04836593 -1.7020284 ]\n",
      "2= tensor([[-0.1365,  0.0799]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10001826  1.3455199  -0.0824065  -2.0093658 ]\n",
      "2= tensor([[-0.1615,  0.0799]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12692866  1.541397   -0.12259382 -2.3263845 ]\n",
      "2= tensor([[-0.1896,  0.0784]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1577566  1.7373993 -0.1691215 -2.654134 ]\n",
      "2= tensor([[-0.2173,  0.0769]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03240529 -0.01374482  0.02538698  0.0386155 ]\n",
      "2= tensor([[-0.0917,  0.0221]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03268019  0.18100406  0.02615929 -0.24595071]\n",
      "2= tensor([[-0.0988,  0.0440]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02906011  0.37574282  0.02124028 -0.53026897]\n",
      "2= tensor([[-0.0987,  0.0526]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02154525  0.18032861  0.0106349  -0.2309696 ]\n",
      "2= tensor([[-0.0989,  0.0438]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01793868  0.37529698  0.00601551 -0.52027905]\n",
      "2= tensor([[-0.0992,  0.0525]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01043274  0.5703337  -0.00439007 -0.8110603 ]\n",
      "2= tensor([[-0.1046,  0.0622]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 9.7393669e-04  7.6551557e-01 -2.0611281e-02 -1.1051209e+00]\n",
      "2= tensor([[-0.1102,  0.0709]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01628425  0.9609024  -0.0427137  -1.4041982 ]\n",
      "2= tensor([[-0.1206,  0.0776]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0355023   1.156528   -0.07079766 -1.7099229 ]\n",
      "2= tensor([[-0.1402,  0.0804]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05863285  1.3523884  -0.10499612 -2.0237746 ]\n",
      "2= tensor([[-0.1660,  0.0801]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08568062  1.5484288  -0.14547162 -2.347028  ]\n",
      "2= tensor([[-0.1945,  0.0782]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1166492   1.7445271  -0.19241217 -2.6806867 ]\n",
      "2= tensor([[-0.2232,  0.0760]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "C:\\Users\\25036\\AppData\\Local\\Temp\\ipykernel_15580\\1266603837.py:51: UserWarning: Creating a tensor from a list of numpy.ndarrays is extremely slow. Please consider converting the list to a single numpy.ndarray with numpy.array() before converting to a tensor. (Triggered internally at C:\\actions-runner\\_work\\pytorch\\pytorch\\builder\\windows\\pytorch\\torch\\csrc\\utils\\tensor_new.cpp:281.)\n",
      "  state = torch.FloatTensor([i[0] for i in data]).reshape(-1, 4)  # 提取状态并转换为形状为 [64, 4] 的张量\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(207,\n",
       " (array([ 0.00487011,  0.00548145, -0.04611025, -0.01432442], dtype=float32),\n",
       "  1,\n",
       "  1.0,\n",
       "  array([ 0.00497974,  0.20123331, -0.04639674, -0.32119173], dtype=float32),\n",
       "  False))"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 8
  },
  {
   "cell_type": "code",
   "id": "018c4b1e",
   "metadata": {
    "scrolled": true,
    "ExecuteTime": {
     "end_time": "2024-12-30T06:23:22.581630Z",
     "start_time": "2024-12-30T06:23:19.148297Z"
    }
   },
   "source": [
    "#训练\n",
    "def train():\n",
    "    # 训练模式\n",
    "    model.train()\n",
    "    '''\n",
    "    定义优化器，这里使用的是 Adam 优化器。\n",
    "    model.parameters()：传入模型的所有可训练参数。\n",
    "    lr=2e-4：学习率为 \n",
    "    0.0002\n",
    "    0.0002，表示每次参数更新的步长。\n",
    "    '''\n",
    "    optimizer = torch.optim.Adam(model.parameters(), lr=2e-4)\n",
    "    # 定义损失函数为 均方误差（MSE），用于计算模型输出的 Q 值和目标 Q 值之间的差异：\n",
    "    loss_fn = torch.nn.MSELoss()\n",
    "\n",
    "    #共更新N轮数据\n",
    "    for epoch in range(5):\n",
    "        pool.update()\n",
    "\n",
    "        #每次更新数据后,训练N次\n",
    "        for i in range(200):\n",
    "            #采样N条数据\n",
    "            state, action, reward, next_state, over = pool.sample()\n",
    "\n",
    "            #计算value\n",
    "            value = model(state).gather(dim=1, index=action)\n",
    "\n",
    "            #计算target\n",
    "            with torch.no_grad():  #禁用梯度计算，用于推理（预测）模型的输出，节省内存和加速。\n",
    "                target = model(next_state)\n",
    "            target = target.max(dim=1)[0].reshape(-1, 1)  #从下一状态的 Q 值中选择最大值\n",
    "            target = target * 0.99 * (1 - over) + reward  #根据 Bellman 方程计算目标 Q 值\n",
    "\n",
    "            loss = loss_fn(value, target)  #计算模型输出的 Q 值（value）与目标 Q 值（target）之间的误差，使用均方误差（MSE）。\n",
    "            loss.backward()  #计算损失函数的梯度，反向传播误差。\n",
    "            optimizer.step()  #使用梯度更新模型的参数。\n",
    "            optimizer.zero_grad()  #清空上一步的梯度，防止梯度累积。\n",
    "        # 每 100 个训练周期，使用模型玩 20 局游戏，计算平均奖励（play() 的返回值的最后一项是总奖励）。\n",
    "        if epoch % 100 == 0:\n",
    "            test_result = sum([play()[-1] for _ in range(20)]) / 20\n",
    "            print(epoch, len(pool), test_result)\n",
    "\n",
    "train()\n"
   ],
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1= [ 0.02555388 -0.0200416   0.01938441  0.02394837]\n",
      "2= tensor([[-0.0900,  0.0189]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02515304  0.17479707  0.01986337 -0.26255608]\n",
      "2= tensor([[-0.0970,  0.0411]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02864899  0.36962995  0.01461225 -0.5489083 ]\n",
      "2= tensor([[-0.0983,  0.0488]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03604158  0.5645436   0.00363409 -0.83695173]\n",
      "2= tensor([[-0.1025,  0.0607]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04733246  0.7596157  -0.01310495 -1.1284896 ]\n",
      "2= tensor([[-0.1103,  0.0682]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06252477  0.9549069  -0.03567474 -1.4252539 ]\n",
      "2= tensor([[-0.1205,  0.0750]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08162291  0.76024354 -0.06417982 -1.1439308 ]\n",
      "2= tensor([[-0.1147,  0.0661]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09682778  0.5660161  -0.08705843 -0.87204534]\n",
      "2= tensor([[-0.1088,  0.0594]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10814811  0.76220727 -0.10449934 -1.1907804 ]\n",
      "2= tensor([[-0.1183,  0.0640]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12339225  0.9585164  -0.12831494 -1.5143048 ]\n",
      "2= tensor([[-0.1331,  0.0663]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.14256257  1.1549368  -0.15860105 -1.8441343 ]\n",
      "2= tensor([[-0.1567,  0.0679]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1656613   1.3514128  -0.19548373 -2.181583  ]\n",
      "2= tensor([[-0.1858,  0.0667]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01634859  0.04537755 -0.01114015 -0.03181183]\n",
      "2= tensor([[-0.0945,  0.0273]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01544103  0.24065746 -0.01177639 -0.32798865]\n",
      "2= tensor([[-0.0993,  0.0479]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01062788  0.43594506 -0.01833616 -0.62436193]\n",
      "2= tensor([[-0.1027,  0.0536]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00190898  0.63131815 -0.0308234  -0.9227628 ]\n",
      "2= tensor([[-0.1080,  0.0647]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01071738  0.82684267 -0.04927866 -1.2249709 ]\n",
      "2= tensor([[-0.1156,  0.0716]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02725423  1.0225633  -0.07377808 -1.5326777 ]\n",
      "2= tensor([[-0.1299,  0.0768]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0477055   1.2184927  -0.10443163 -1.8474433 ]\n",
      "2= tensor([[-0.1527,  0.0778]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07207536  1.4145985  -0.1413805  -2.1706464 ]\n",
      "2= tensor([[-0.1808,  0.0767]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10036732  1.6107883  -0.18479343 -2.5034225 ]\n",
      "2= tensor([[-0.2100,  0.0742]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03324316  0.01186443  0.02026501 -0.02629971]\n",
      "2= tensor([[-0.0911,  0.0226]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03348045  0.20668998  0.01973902 -0.31252053]\n",
      "2= tensor([[-0.0967,  0.0427]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03761425  0.40152526  0.01348861 -0.5989136 ]\n",
      "2= tensor([[-0.0990,  0.0490]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04564476  0.59645593  0.00151034 -0.8873175 ]\n",
      "2= tensor([[-0.1034,  0.0619]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05757388  0.7915573  -0.01623601 -1.1795253 ]\n",
      "2= tensor([[-0.1121,  0.0689]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07340502  0.98688626 -0.03982652 -1.4772532 ]\n",
      "2= tensor([[-0.1235,  0.0753]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09314275  1.1824714  -0.06937158 -1.782104  ]\n",
      "2= tensor([[-0.1436,  0.0778]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.11679217  1.3783014  -0.10501366 -2.0955215 ]\n",
      "2= tensor([[-0.1702,  0.0773]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1443582  1.5743117 -0.1469241 -2.4187346]\n",
      "2= tensor([[-0.1987,  0.0755]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.17584443  1.7703675  -0.19529878 -2.7526903 ]\n",
      "2= tensor([[-0.2261,  0.0739]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00270915 -0.03002393  0.02423548 -0.0277936 ]\n",
      "2= tensor([[-0.0915,  0.0207]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00210867  0.16474223  0.02367961 -0.31273252]\n",
      "2= tensor([[-0.0976,  0.0417]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00540351  0.35951898  0.01742496 -0.59785455]\n",
      "2= tensor([[-0.0997,  0.0488]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01259389  0.5543928   0.00546787 -0.8849983 ]\n",
      "2= tensor([[-0.1036,  0.0596]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02368175  0.74944013 -0.0122321  -1.1759573 ]\n",
      "2= tensor([[-0.1109,  0.0674]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03867055  0.94471884 -0.03575125 -1.4724497 ]\n",
      "2= tensor([[-0.1232,  0.0738]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05756493  1.1402591  -0.06520024 -1.7760813 ]\n",
      "2= tensor([[-0.1432,  0.0764]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08037011  1.3360522  -0.10072187 -2.0883021 ]\n",
      "2= tensor([[-0.1695,  0.0761]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10709116  1.5320362  -0.14248791 -2.4103503 ]\n",
      "2= tensor([[-0.1981,  0.0742]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.13773188  1.7280798  -0.19069491 -2.7431855 ]\n",
      "2= tensor([[-0.2272,  0.0716]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04627557  0.03582875 -0.03116341  0.01974751]\n",
      "2= tensor([[-0.0940,  0.0270]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.045559    0.23138344 -0.03076846 -0.28260267]\n",
      "2= tensor([[-0.1010,  0.0492]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04093133  0.42693043 -0.03642051 -0.5848288 ]\n",
      "2= tensor([[-0.1040,  0.0560]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03239272  0.6225431  -0.04811709 -0.88875854]\n",
      "2= tensor([[-0.1096,  0.0658]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01994186  0.81828386 -0.06589226 -1.1961708 ]\n",
      "2= tensor([[-0.1163,  0.0726]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00357618  1.014194   -0.08981567 -1.5087566 ]\n",
      "2= tensor([[-0.1304,  0.0775]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0167077  1.2102826 -0.1199908 -1.8280741]\n",
      "2= tensor([[-0.1536,  0.0782]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04091335  1.4065129  -0.15655228 -2.155496  ]\n",
      "2= tensor([[-0.1820,  0.0770]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06904361  1.6027876  -0.19966221 -2.4921463 ]\n",
      "2= tensor([[-0.2119,  0.0739]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00200106 -0.00597205  0.03812237  0.01384568]\n",
      "2= tensor([[-0.0918,  0.0214]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00188162  0.18858303  0.03839929 -0.26656964]\n",
      "2= tensor([[-0.0972,  0.0425]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00565328  0.3831365   0.0330679  -0.5468981 ]\n",
      "2= tensor([[-0.0975,  0.0502]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01331601  0.57777864  0.02212993 -0.8289815 ]\n",
      "2= tensor([[-0.1022,  0.0620]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02487158  0.7725912   0.0055503  -1.1146231 ]\n",
      "2= tensor([[-0.1083,  0.0706]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0403234   0.9676398  -0.01674216 -1.4055598 ]\n",
      "2= tensor([[-0.1187,  0.0776]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0596762   1.1629655  -0.04485335 -1.7034292 ]\n",
      "2= tensor([[-0.1368,  0.0815]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08293551  1.3585742  -0.07892194 -2.0097296 ]\n",
      "2= tensor([[-0.1615,  0.0815]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.110107    1.5544236  -0.11911653 -2.3257682 ]\n",
      "2= tensor([[-0.1895,  0.0800]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.14119546  1.360567   -0.16563189 -2.0719814 ]\n",
      "2= tensor([[-0.1752,  0.0734]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1684068   1.55694    -0.20707153 -2.410983  ]\n",
      "2= tensor([[-0.2039,  0.0715]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04327204 -0.01149411  0.01675462 -0.01582917]\n",
      "2= tensor([[-0.0899,  0.0200]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04304215  0.1833836   0.01643804 -0.3031791 ]\n",
      "2= tensor([[-0.0965,  0.0410]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04670982  0.37826747  0.01037446 -0.5906328 ]\n",
      "2= tensor([[-0.0989,  0.0476]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05427517  0.57324266 -0.0014382  -0.8800298 ]\n",
      "2= tensor([[-0.1032,  0.0604]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06574003  0.7683841  -0.01903879 -1.1731645 ]\n",
      "2= tensor([[-0.1119,  0.0671]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08110771  0.9637483  -0.04250208 -1.4717548 ]\n",
      "2= tensor([[-0.1234,  0.0733]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10038268  1.1593634  -0.07193718 -1.7774043 ]\n",
      "2= tensor([[-0.1431,  0.0760]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12356994  1.3552179  -0.10748526 -2.0915575 ]\n",
      "2= tensor([[-0.1699,  0.0756]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.1506743   1.5512466  -0.14931642 -2.4154434 ]\n",
      "2= tensor([[-0.1984,  0.0738]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.18169923  1.7473141  -0.1976253  -2.7500083 ]\n",
      "2= tensor([[-0.2263,  0.0720]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01448254 -0.02557196 -0.03722504 -0.03847663]\n",
      "2= tensor([[-0.0910,  0.0228]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01499398  0.17006348 -0.03799457 -0.34266812]\n",
      "2= tensor([[-0.1001,  0.0446]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01159271  0.3657048  -0.04484794 -0.647086  ]\n",
      "2= tensor([[-0.1053,  0.0509]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00427862  0.17123546 -0.05778966 -0.3688562 ]\n",
      "2= tensor([[-0.1002,  0.0443]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00085391  0.36712888 -0.06516678 -0.6791865 ]\n",
      "2= tensor([[-0.1071,  0.0503]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00648867  0.1729698  -0.07875051 -0.40771157]\n",
      "2= tensor([[-0.1004,  0.0441]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00994806  0.3691149  -0.08690474 -0.72414607]\n",
      "2= tensor([[-0.1091,  0.0495]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01733036  0.56532437 -0.10138766 -1.0428674 ]\n",
      "2= tensor([[-0.1136,  0.0569]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02863685  0.7616359  -0.12224501 -1.3655795 ]\n",
      "2= tensor([[-0.1261,  0.0615]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04386957  0.958058   -0.1495566  -1.6938646 ]\n",
      "2= tensor([[-0.1465,  0.0631]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06303073  1.1545568  -0.18343389 -2.0291283 ]\n",
      "2= tensor([[-0.1741,  0.0624]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02835963  0.02079705 -0.02057378 -0.02198523]\n",
      "2= tensor([[-0.0937,  0.0259]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02794369 -0.17402391 -0.02101349  0.26413608]\n",
      "2= tensor([[-0.0769, -0.0016]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03142417  0.02139158 -0.01573077 -0.03509993]\n",
      "2= tensor([[-0.0941,  0.0264]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03099634  0.21673554 -0.01643277 -0.33270428]\n",
      "2= tensor([[-0.1000,  0.0474]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02666163  0.41208747 -0.02308685 -0.6305236 ]\n",
      "2= tensor([[-0.1038,  0.0533]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01841988  0.60752386 -0.03569732 -0.930387  ]\n",
      "2= tensor([[-0.1084,  0.0635]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0062694   0.80310893 -0.05430507 -1.2340705 ]\n",
      "2= tensor([[-0.1153,  0.0703]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00979278  0.60872555 -0.07898647 -0.95888305]\n",
      "2= tensor([[-0.1122,  0.0622]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02196729  0.8048155  -0.09816413 -1.2752988 ]\n",
      "2= tensor([[-0.1195,  0.0680]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0380636   1.0010427  -0.12367011 -1.5970367 ]\n",
      "2= tensor([[-0.1380,  0.0706]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05808445  1.1973947  -0.15561084 -1.9255816 ]\n",
      "2= tensor([[-0.1638,  0.0707]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08203235  1.3938067  -0.19412248 -2.262205  ]\n",
      "2= tensor([[-0.1931,  0.0689]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0305099  -0.04449748  0.00766382 -0.00376165]\n",
      "2= tensor([[-0.0907,  0.0212]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03139985 -0.2397285   0.00758858  0.2913294 ]\n",
      "2= tensor([[-0.0740, -0.0078]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03619442 -0.04471557  0.01341517  0.00104947]\n",
      "2= tensor([[-0.0909,  0.0213]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03708873  0.15021144  0.01343616 -0.2873708 ]\n",
      "2= tensor([[-0.0993,  0.0430]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0340845   0.34513924  0.00768874 -0.575786  ]\n",
      "2= tensor([[-0.1007,  0.0512]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02718172  0.54015255 -0.00382697 -0.86603683]\n",
      "2= tensor([[-0.1056,  0.0601]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01637867  0.7353264  -0.02114771 -1.1599206 ]\n",
      "2= tensor([[-0.1106,  0.0681]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00167214  0.9307174  -0.04434612 -1.4591585 ]\n",
      "2= tensor([[-0.1236,  0.0745]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01694221  1.1263543  -0.0735293  -1.7653588 ]\n",
      "2= tensor([[-0.1442,  0.0768]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03946929  1.3222263  -0.10883647 -2.079971  ]\n",
      "2= tensor([[-0.1704,  0.0764]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06591382  1.5182691  -0.1504359  -2.40423   ]\n",
      "2= tensor([[-0.1993,  0.0743]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0962792  1.7143487 -0.1985205 -2.7390893]\n",
      "2= tensor([[-0.2291,  0.0711]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02964349  0.0307592  -0.01972906 -0.02944218]\n",
      "2= tensor([[-0.0944,  0.0268]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02902831  0.22615844 -0.0203179  -0.32828397]\n",
      "2= tensor([[-0.1001,  0.0479]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02450514  0.42156366 -0.02688358 -0.6273044 ]\n",
      "2= tensor([[-0.1040,  0.0537]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01607387  0.61705035 -0.03942967 -0.9283312 ]\n",
      "2= tensor([[-0.1088,  0.0641]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00373286  0.8126818  -0.0579963  -1.2331396 ]\n",
      "2= tensor([[-0.1157,  0.0708]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01252078  1.0084995  -0.08265909 -1.5434138 ]\n",
      "2= tensor([[-0.1314,  0.0756]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03269077  1.2045119  -0.11352737 -1.8607025 ]\n",
      "2= tensor([[-0.1548,  0.0764]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.056781    1.4006811  -0.15074141 -2.1863675 ]\n",
      "2= tensor([[-0.1832,  0.0752]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08479463  1.5969082  -0.19446877 -2.5215206 ]\n",
      "2= tensor([[-0.2130,  0.0722]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00984151 -0.0165793  -0.00296071  0.03616259]\n",
      "2= tensor([[-0.0907,  0.0209]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0101731   0.17858498 -0.00223745 -0.257453  ]\n",
      "2= tensor([[-0.0990,  0.0436]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0066014   0.3737388  -0.00738651 -0.5508408 ]\n",
      "2= tensor([[-0.1005,  0.0516]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00087338  0.5689637  -0.01840333 -0.8458418 ]\n",
      "2= tensor([[-0.1057,  0.0617]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01225265  0.7643319  -0.03532017 -1.1442547 ]\n",
      "2= tensor([[-0.1123,  0.0692]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02753929  0.959897   -0.05820526 -1.4478014 ]\n",
      "2= tensor([[-0.1240,  0.0752]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04673723  0.765537   -0.08716129 -1.1738578 ]\n",
      "2= tensor([[-0.1168,  0.0665]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06204797  0.9616769  -0.11063845 -1.4925438 ]\n",
      "2= tensor([[-0.1309,  0.0705]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08128151  1.1579577  -0.14048932 -1.8176261 ]\n",
      "2= tensor([[-0.1538,  0.0719]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10444066  1.354335   -0.17684184 -2.1504579 ]\n",
      "2= tensor([[-0.1826,  0.0707]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01093564  0.0450504   0.02275675 -0.00783466]\n",
      "2= tensor([[-0.0928,  0.0257]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01183665  0.23983872  0.02260005 -0.29325157]\n",
      "2= tensor([[-0.0974,  0.0455]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01663342  0.4346313   0.01673502 -0.57872194]\n",
      "2= tensor([[-0.0985,  0.0521]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02532605  0.62951475  0.00516058 -0.86608636]\n",
      "2= tensor([[-0.1037,  0.0652]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03791634  0.82456607 -0.01216114 -1.1571423 ]\n",
      "2= tensor([[-0.1117,  0.0724]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05440767  1.0198444  -0.03530399 -1.4536134 ]\n",
      "2= tensor([[-0.1222,  0.0794]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07480455  1.2153817  -0.06437626 -1.7571137 ]\n",
      "2= tensor([[-0.1422,  0.0818]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09911219  1.4111713  -0.09951853 -2.0691032 ]\n",
      "2= tensor([[-0.1683,  0.0814]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12733561  1.6071545  -0.1409006  -2.3908339 ]\n",
      "2= tensor([[-0.1967,  0.0795]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.15947871  1.8032045  -0.18871728 -2.7232823 ]\n",
      "2= tensor([[-0.2233,  0.0783]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03144624 -0.02537     0.03247642 -0.00362196]\n",
      "2= tensor([[-0.0902,  0.0191]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03093884  0.1692715   0.03240398 -0.28588387]\n",
      "2= tensor([[-0.0964,  0.0403]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03432427  0.3639167   0.0266863  -0.5681733 ]\n",
      "2= tensor([[-0.0978,  0.0475]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04160261  0.55865437  0.01532284 -0.8523309 ]\n",
      "2= tensor([[-0.1017,  0.0600]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05277569  0.3633269  -0.00172378 -0.5548694 ]\n",
      "2= tensor([[-0.0987,  0.0477]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06004223  0.558473   -0.01282117 -0.84809494]\n",
      "2= tensor([[-0.1033,  0.0599]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.07121169  0.7537675  -0.02978307 -1.1447818 ]\n",
      "2= tensor([[-0.1120,  0.0663]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08628704  0.94926554 -0.0526787  -1.4466538 ]\n",
      "2= tensor([[-0.1230,  0.0723]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10527235  1.1449944  -0.08161178 -1.7553202 ]\n",
      "2= tensor([[-0.1424,  0.0752]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12817223  1.3409412  -0.11671819 -2.0722294 ]\n",
      "2= tensor([[-0.1695,  0.0747]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.15499106  1.5370395  -0.15816277 -2.3986127 ]\n",
      "2= tensor([[-0.1980,  0.0730]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.18573186  1.733152   -0.20613503 -2.7354162 ]\n",
      "2= tensor([[-0.2260,  0.0712]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03096331 -0.00253034 -0.01291424 -0.01256521]\n",
      "2= tensor([[-0.0908,  0.0209]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03091271  0.19277442 -0.01316554 -0.3092946 ]\n",
      "2= tensor([[-0.0979,  0.0429]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0347682   0.38808146 -0.01935143 -0.6061003 ]\n",
      "2= tensor([[-0.1014,  0.0494]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04252983  0.58346856 -0.03147344 -0.9048151 ]\n",
      "2= tensor([[-0.1065,  0.0608]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0541992   0.7790023  -0.04956974 -1.2072221 ]\n",
      "2= tensor([[-0.1149,  0.0670]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06977924  0.9747284  -0.07371418 -1.5150181 ]\n",
      "2= tensor([[-0.1286,  0.0720]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08927381  1.170661   -0.10401455 -1.8297713 ]\n",
      "2= tensor([[-0.1503,  0.0738]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.11268703  1.3667701  -0.14060996 -2.1528702 ]\n",
      "2= tensor([[-0.1784,  0.0729]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.14002243  1.5629665  -0.18366738 -2.4854636 ]\n",
      "2= tensor([[-0.2073,  0.0708]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02665072  0.00212866  0.00149717  0.03607342]\n",
      "2= tensor([[-0.0922,  0.0230]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02660815  0.1972291   0.00221863 -0.25613678]\n",
      "2= tensor([[-0.0994,  0.0453]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02266357  0.39231932 -0.0029041  -0.54811907]\n",
      "2= tensor([[-0.1005,  0.0532]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01481718  0.5874819  -0.01386648 -0.8417156 ]\n",
      "2= tensor([[-0.1060,  0.0634]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00306754  0.7827904  -0.0307008  -1.1387267 ]\n",
      "2= tensor([[-0.1121,  0.0713]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01258827  0.97830003 -0.05347533 -1.4408777 ]\n",
      "2= tensor([[-0.1234,  0.0776]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03215427  1.1740383  -0.08229288 -1.7497795 ]\n",
      "2= tensor([[-0.1441,  0.0798]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05563504  1.3699927  -0.11728847 -2.0668833 ]\n",
      "2= tensor([[-0.1706,  0.0793]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08303489  1.5660971  -0.15862614 -2.3934228 ]\n",
      "2= tensor([[-0.1995,  0.0771]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.11435683  1.7622151  -0.20649458 -2.7303472 ]\n",
      "2= tensor([[-0.2284,  0.0746]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03435815  0.02738554 -0.01714526 -0.04456913]\n",
      "2= tensor([[-0.0921,  0.0244]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03490586  0.2227491  -0.01803664 -0.34261185]\n",
      "2= tensor([[-0.0977,  0.0443]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03936084  0.41812295 -0.02488887 -0.64092743]\n",
      "2= tensor([[-0.1015,  0.0507]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0477233   0.61358285 -0.03770743 -0.94134307]\n",
      "2= tensor([[-0.1075,  0.0621]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05999496  0.8091922  -0.05653429 -1.2456318 ]\n",
      "2= tensor([[-0.1165,  0.0679]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0761788   1.0049919  -0.08144692 -1.5554744 ]\n",
      "2= tensor([[-0.1313,  0.0725]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.09627864  1.2009897  -0.11255641 -1.8724155 ]\n",
      "2= tensor([[-0.1544,  0.0737]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.12029844  1.397147   -0.15000473 -2.1978114 ]\n",
      "2= tensor([[-0.1828,  0.0726]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.14824139  1.5933633  -0.19396095 -2.5327668 ]\n",
      "2= tensor([[-0.2117,  0.0705]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02760312  0.00123947 -0.010056    0.03073216]\n",
      "2= tensor([[-0.0920,  0.0232]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02757833  0.19650418 -0.00944136 -0.2651065 ]\n",
      "2= tensor([[-0.0998,  0.0457]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02364825  0.3917596  -0.01474349 -0.56075233]\n",
      "2= tensor([[-0.1016,  0.0534]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01581306  0.5870853  -0.02595854 -0.8580435 ]\n",
      "2= tensor([[-0.1070,  0.0633]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00407135  0.7825511  -0.0431194  -1.1587744 ]\n",
      "2= tensor([[-0.1135,  0.0706]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01157967  0.97820765 -0.06629489 -1.4646595 ]\n",
      "2= tensor([[-0.1258,  0.0764]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03114382  1.1740761  -0.09558808 -1.7772931 ]\n",
      "2= tensor([[-0.1472,  0.0782]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05462534  1.3701357  -0.13113394 -2.0981002 ]\n",
      "2= tensor([[-0.1745,  0.0775]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08202806  1.5663098  -0.17309594 -2.428278  ]\n",
      "2= tensor([[-0.2036,  0.0751]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01134786 -0.02601242  0.04657099 -0.03764451]\n",
      "2= tensor([[-0.0918,  0.0209]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01082761  0.16841184  0.0458181  -0.31527776]\n",
      "2= tensor([[-0.0966,  0.0409]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01419585  0.3628522   0.03951254 -0.5931664 ]\n",
      "2= tensor([[-0.0980,  0.0479]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02145289  0.5573994   0.02764922 -0.8731458 ]\n",
      "2= tensor([[-0.1016,  0.0597]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03260088  0.75213474  0.0101863  -1.1570092 ]\n",
      "2= tensor([[-0.1087,  0.0680]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04764357  0.9471224  -0.01295388 -1.4464809 ]\n",
      "2= tensor([[-0.1196,  0.0754]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06658603  1.1424013  -0.0418835  -1.743183  ]\n",
      "2= tensor([[-0.1387,  0.0785]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08943405  0.94778013 -0.07674716 -1.4638175 ]\n",
      "2= tensor([[-0.1260,  0.0706]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.10838965  1.1437539  -0.10602351 -1.7794542 ]\n",
      "2= tensor([[-0.1465,  0.0731]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.13126473  1.3398973  -0.14161259 -2.1031299 ]\n",
      "2= tensor([[-0.1745,  0.0722]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.15806267  1.536128   -0.1836752  -2.4360247 ]\n",
      "2= tensor([[-0.2033,  0.0704]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00092305 -0.04620118  0.01614219 -0.04599606]\n",
      "2= tensor([[-0.0907,  0.0203]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-9.7370264e-07  1.4868563e-01  1.5222272e-02 -3.3354259e-01]\n",
      "2= tensor([[-0.0979,  0.0412]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00297274  0.34358764  0.00855142 -0.6213866 ]\n",
      "2= tensor([[-0.1009,  0.0481]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00984449  0.14834733 -0.00387631 -0.3260227 ]\n",
      "2= tensor([[-0.0982,  0.0412]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01281144  0.34352425 -0.01039677 -0.61992556]\n",
      "2= tensor([[-0.1019,  0.0481]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01968192  0.53878987 -0.02279528 -0.9158647 ]\n",
      "2= tensor([[-0.1060,  0.0578]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03045772  0.7342125  -0.04111257 -1.2156237 ]\n",
      "2= tensor([[-0.1130,  0.0647]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04514197  0.92984    -0.06542505 -1.5209007 ]\n",
      "2= tensor([[-0.1284,  0.0698]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06373877  1.1256888  -0.09584306 -1.8332666 ]\n",
      "2= tensor([[-0.1496,  0.0718]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.08625255  1.3217317  -0.1325084  -2.1541162 ]\n",
      "2= tensor([[-0.1776,  0.0710]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.11268718  1.5178832  -0.17559071 -2.4846077 ]\n",
      "2= tensor([[-0.2072,  0.0683]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03711552  0.01661487 -0.04925909 -0.02343822]\n",
      "2= tensor([[-0.1228, -0.2134]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03744782 -0.1777673  -0.04972785  0.25330508]\n",
      "2= tensor([[0.0159, 0.1350]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03389247  0.01802812 -0.04466175 -0.05463899]\n",
      "2= tensor([[-0.1329, -0.2460]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03425303  0.21376106 -0.04575453 -0.36107183]\n",
      "2= tensor([[-0.2823, -0.7049]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03852826  0.01931833 -0.05297597 -0.08316009]\n",
      "2= tensor([[-0.1447, -0.2805]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03891462 -0.17500578 -0.05463917  0.1923495 ]\n",
      "2= tensor([[-0.0021,  0.0920]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03541451  0.0208535  -0.05079218 -0.11705693]\n",
      "2= tensor([[-0.1559, -0.3167]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03583157 -0.17350529 -0.05313332  0.1591788 ]\n",
      "2= tensor([[-0.0127,  0.0668]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03236147  0.02233551 -0.04994974 -0.14978167]\n",
      "2= tensor([[-0.1669, -0.3525]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03280818 -0.17203692 -0.05294538  0.12673421]\n",
      "2= tensor([[-0.0229,  0.0417]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02936744  0.02380197 -0.05041069 -0.18217115]\n",
      "2= tensor([[-0.1780, -0.3880]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02984348 -0.17056377 -0.05405411  0.09419261]\n",
      "2= tensor([[-0.0333,  0.0157]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0264322   0.02528959 -0.05217027 -0.21504252]\n",
      "2= tensor([[-0.1893, -0.4240]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.026938   -0.1690492  -0.05647111  0.06073796]\n",
      "2= tensor([[-0.0458, -0.0155]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02355701  0.02683504 -0.05525636 -0.24921371]\n",
      "2= tensor([[-0.2013, -0.4615]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02409371 -0.16745605 -0.06024063  0.02554101]\n",
      "2= tensor([[-0.0585, -0.0505]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02074459  0.02847575 -0.05972981 -0.28552362]\n",
      "2= tensor([[-0.2141, -0.5015]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02131411 -0.16574574 -0.06544028 -0.01226105]\n",
      "2= tensor([[-0.0723, -0.0898]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01799919 -0.35987112 -0.0656855   0.25907806]\n",
      "2= tensor([[0.0552, 0.2037]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01080177 -0.55399686 -0.06050394  0.530341  ]\n",
      "2= tensor([[0.1221, 0.3354]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-2.7816551e-04 -3.5807830e-01 -4.9897119e-02  2.1922365e-01]\n",
      "2= tensor([[0.0474, 0.1880]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00743973 -0.16227992 -0.04551265 -0.08877205]\n",
      "2= tensor([[-0.0934, -0.1589]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01068533 -0.35672095 -0.04728809  0.18921138]\n",
      "2= tensor([[0.0394, 0.1722]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01781975 -0.16095549 -0.04350386 -0.11800607]\n",
      "2= tensor([[-0.1020, -0.1858]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02103886 -0.355428   -0.04586398  0.16064058]\n",
      "2= tensor([[0.0316, 0.1566]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02814742 -0.15968047 -0.04265117 -0.14615121]\n",
      "2= tensor([[-0.1105, -0.2124]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03134103 -0.3541665  -0.0455742   0.13277687]\n",
      "2= tensor([[0.0239, 0.1405]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03842436 -0.15842237 -0.04291866 -0.17392863]\n",
      "2= tensor([[-0.1193, -0.2397]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04159281 -0.35290462 -0.04639723  0.1049119 ]\n",
      "2= tensor([[0.0163, 0.1243]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0486509  -0.15714954 -0.04429899 -0.20204063]\n",
      "2= tensor([[-0.1285, -0.2695]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05179389 -0.35161087 -0.04833981  0.07634556]\n",
      "2= tensor([[0.0084, 0.1076]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05882611 -0.15583046 -0.0468129  -0.23118839]\n",
      "2= tensor([[-0.1380, -0.3006]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06194272 -0.3502533  -0.05143666  0.04636844]\n",
      "2= tensor([[8.5607e-05, 8.9762e-02]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06894778 -0.15443297 -0.05050929 -0.2620893 ]\n",
      "2= tensor([[-0.1476, -0.3328]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07203644 -0.3487989  -0.05575108  0.01424436]\n",
      "2= tensor([[-0.0089,  0.0698]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07901242 -0.15292357 -0.05546619 -0.29549447]\n",
      "2= tensor([[-0.1583, -0.3680]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08207089 -0.3472127  -0.06137608 -0.02080764]\n",
      "2= tensor([[-0.0183,  0.0453]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08901514 -0.15126671 -0.06179224 -0.33220646]\n",
      "2= tensor([[-0.1706, -0.4077]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09204048 -0.3454572  -0.06843636 -0.05963202]\n",
      "2= tensor([[-0.0283,  0.0118]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09894963 -0.14942414 -0.06962901 -0.37309787]\n",
      "2= tensor([[-0.1868, -0.4560]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10193811 -0.34349144 -0.07709096 -0.10315666]\n",
      "2= tensor([[-0.0419, -0.0318]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10880794 -0.1473542  -0.0791541  -0.41913104]\n",
      "2= tensor([[-0.2076, -0.5154]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11175502 -0.34127054 -0.08753671 -0.15241428]\n",
      "2= tensor([[-0.0592, -0.0835]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11858043 -0.5350371  -0.090585    0.11141977]\n",
      "2= tensor([[0.0523, 0.1933]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12928118 -0.33874175 -0.08835661 -0.20841162]\n",
      "2= tensor([[-0.0794, -0.1437]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.136056   -0.53249645 -0.09252483  0.05514368]\n",
      "2= tensor([[0.0381, 0.1626]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.14670594 -0.33617803 -0.09142196 -0.2652379 ]\n",
      "2= tensor([[-0.1033, -0.2133]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1534295  -0.5298843  -0.09672672 -0.00273254]\n",
      "2= tensor([[0.0228, 0.1291]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.16402718 -0.3335178  -0.09678137 -0.3242988 ]\n",
      "2= tensor([[-0.1286, -0.2869]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.17069754 -0.13716057 -0.10326735 -0.6458656 ]\n",
      "2= tensor([[-0.3110, -0.8092]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.17344075 -0.3307035  -0.11618466 -0.3874045 ]\n",
      "2= tensor([[-0.1576, -0.3705]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.18005481 -0.52400106 -0.12393275 -0.13349444]\n",
      "2= tensor([[-0.0194,  0.0267]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.19053484 -0.32734188 -0.12660263 -0.46256366]\n",
      "2= tensor([[-0.1918, -0.4695]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.19708169 -0.5204686  -0.13585392 -0.21231396]\n",
      "2= tensor([[-0.0514, -0.0563]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.20749106 -0.71341306 -0.1401002   0.03461778]\n",
      "2= tensor([[0.0614, 0.1930]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.2217593  -0.51658905 -0.13940783 -0.29878035]\n",
      "2= tensor([[-0.0860, -0.1613]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.2320911  -0.70947707 -0.14538345 -0.05310856]\n",
      "2= tensor([[0.0340, 0.1378]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.24628064 -0.5126021  -0.14644562 -0.3878979 ]\n",
      "2= tensor([[-0.1256, -0.2770]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.25653267 -0.7053748  -0.15420358 -0.14473534]\n",
      "2= tensor([[-0.0004,  0.0669]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.27064016 -0.50841933 -0.15709828 -0.48181933]\n",
      "2= tensor([[-0.1688, -0.4021]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.28080857 -0.70101565 -0.16673467 -0.24247965]\n",
      "2= tensor([[-0.0406, -0.0240]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.29482886 -0.5039532  -0.17158426 -0.5827671 ]\n",
      "2= tensor([[-0.2195, -0.5435]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.30490795 -0.6963087  -0.1832396  -0.34866956]\n",
      "2= tensor([[-0.0848, -0.1469]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.3188341  -0.88841605 -0.190213   -0.11890423]\n",
      "2= tensor([[0.0368, 0.1266]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.33660242 -0.69115007 -0.19259107 -0.46505237]\n",
      "2= tensor([[-0.1394, -0.3001]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.35042542 -0.8831036  -0.20189212 -0.23871782]\n",
      "2= tensor([[-0.0150,  0.0244]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.3680875  -0.685756   -0.20666648 -0.5876805 ]\n",
      "2= tensor([[-0.1982, -0.4650]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00526232  0.00632916 -0.00543868  0.02232659]\n",
      "2= tensor([[-0.0962, -0.1427]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0053889  -0.18871437 -0.00499215  0.3132886 ]\n",
      "2= tensor([[0.0381, 0.1871]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00161462 0.00647834 0.00127362 0.0190355 ]\n",
      "2= tensor([[-0.0962, -0.1444]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00174418 -0.18866186  0.00165433  0.31212   ]\n",
      "2= tensor([[0.0382, 0.1877]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00202905  0.00643649  0.00789673  0.01995925]\n",
      "2= tensor([[-0.0947, -0.1416]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00190032 -0.18879782  0.00829591  0.3151232 ]\n",
      "2= tensor([[0.0394, 0.1905]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00567628  0.00620499  0.01459838  0.02506802]\n",
      "2= tensor([[-0.0920, -0.1347]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00555218 -0.18912324  0.01509974  0.3223209 ]\n",
      "2= tensor([[0.0416, 0.1958]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00933464  0.00578047  0.02154616  0.03443783]\n",
      "2= tensor([[-0.0878, -0.1233]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00921904 -0.18964373  0.02223491  0.33384016]\n",
      "2= tensor([[0.0450, 0.2034]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01301191  0.00515482  0.02891172  0.0482511 ]\n",
      "2= tensor([[-0.0822, -0.1073]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01290881 -0.19036952  0.02987674  0.3499139 ]\n",
      "2= tensor([[0.0494, 0.2136]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0167162   0.00431507  0.03687502  0.06679979]\n",
      "2= tensor([[-0.0750, -0.0864]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0166299  -0.19131562  0.03821101  0.37088513]\n",
      "2= tensor([[0.0550, 0.2254]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02045622  0.00324321  0.04562872  0.09049123]\n",
      "2= tensor([[-0.0662, -0.0602]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02039135  0.19768244  0.04743854 -0.18745388]\n",
      "2= tensor([[-0.2067, -0.4829]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0164377   0.00191501  0.04368946  0.11980861]\n",
      "2= tensor([[-0.0575, -0.0324]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0163994   0.19638465  0.04608563 -0.1587769 ]\n",
      "2= tensor([[-0.1972, -0.4520]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01247171  0.00063424  0.0429101   0.14808136]\n",
      "2= tensor([[-0.0492, -0.0066]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01245902  0.19511628  0.04587172 -0.13076147]\n",
      "2= tensor([[-0.1878, -0.4218]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0085567  -0.00063173  0.04325649  0.17603323]\n",
      "2= tensor([[-0.0406,  0.0149]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00856933  0.19384533  0.04677716 -0.10269604]\n",
      "2= tensor([[-0.1783, -0.3916]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00469243 -0.00191469  0.04472324  0.20437026]\n",
      "2= tensor([[-0.0313,  0.0366]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00473072  0.1925401   0.04881064 -0.07387602]\n",
      "2= tensor([[-0.1679, -0.3598]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00087992 -0.00324639  0.04733312  0.23379858]\n",
      "2= tensor([[-0.0216,  0.0592]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00094485  0.19116843  0.05200909 -0.04358628]\n",
      "2= tensor([[-0.1563, -0.3259]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00287852 -0.00465925  0.05113737  0.26504183]\n",
      "2= tensor([[-0.0112,  0.0833]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00278534  0.18969694  0.0564382  -0.01108352]\n",
      "2= tensor([[-0.1443, -0.2906]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00657928 -0.00618709  0.05621653  0.2988587 ]\n",
      "2= tensor([[0.0003, 0.1090]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00645553 0.18809035 0.06219371 0.02442187]\n",
      "2= tensor([[-0.1317, -0.2537]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01021734 -0.00786582  0.06268214  0.336061  ]\n",
      "2= tensor([[0.0110, 0.1355]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01006003 0.18631068 0.06940337 0.06378474]\n",
      "2= tensor([[-0.1176, -0.2126]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01378624 -0.00973417  0.07067906  0.37753227]\n",
      "2= tensor([[0.0226, 0.1647]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01359155 0.18431652 0.0782297  0.10794532]\n",
      "2= tensor([[-0.1021, -0.1662]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01727789 -0.01183424  0.08038861  0.42424768]\n",
      "2= tensor([[0.0348, 0.1920]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0170412  0.18206239 0.08887357 0.1579508 ]\n",
      "2= tensor([[-0.0848, -0.1143]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02068245 -0.01421214  0.09203258  0.4772951 ]\n",
      "2= tensor([[0.0468, 0.2177]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02039821 0.17949809 0.10157848 0.21497884]\n",
      "2= tensor([[-0.0649, -0.0581]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02398817  0.3730322   0.10587806 -0.04401319]\n",
      "2= tensor([[-0.1982, -0.4526]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03144881 0.17656389 0.1049978  0.28010902]\n",
      "2= tensor([[-0.0434, -0.0065]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03498009 0.37004358 0.11059998 0.02230045]\n",
      "2= tensor([[-0.1756, -0.3825]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04238096 0.1735236  0.11104599 0.34772947]\n",
      "2= tensor([[-0.0230,  0.0443]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04585143 0.36690536 0.11800057 0.09202394]\n",
      "2= tensor([[-0.1521, -0.3109]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05318954 0.17030711 0.11984105 0.4194823 ]\n",
      "2= tensor([[0.0008, 0.0995]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05659568 0.3635452  0.1282307  0.16685311]\n",
      "2= tensor([[-0.1267, -0.2340]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06386659 0.16684318 0.13156776 0.4970803 ]\n",
      "2= tensor([[0.0225, 0.1534]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06720345 0.35988846 0.14150937 0.24858437]\n",
      "2= tensor([[-0.0973, -0.1495]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07440122 0.16305904 0.14648105 0.5823424 ]\n",
      "2= tensor([[0.0369, 0.1971]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0776624  0.3558579  0.1581279  0.33915272]\n",
      "2= tensor([[-0.0613, -0.0684]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08477956 0.15888086 0.16491096 0.67722815]\n",
      "2= tensor([[0.0531, 0.2374]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08795717 0.35137427 0.17845552 0.44066975]\n",
      "2= tensor([[-0.0229,  0.0141]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09498466 0.54358137 0.18726891 0.20912562]\n",
      "2= tensor([[-0.1566, -0.3233]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.10585628 0.34634423 0.19145143 0.5545445 ]\n",
      "2= tensor([[0.0112, 0.0940]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.11278317 0.5383355  0.20254232 0.32776284]\n",
      "2= tensor([[-0.1093, -0.2027]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.12354989 0.34099302 0.20909758 0.67686677]\n",
      "2= tensor([[0.0353, 0.1544]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02713693 -0.04538301  0.00979887  0.01121929]\n",
      "2= tensor([[-0.0813, -0.1100]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02804459 -0.24064411  0.01002326  0.3069777 ]\n",
      "2= tensor([[0.0491, 0.2090]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03285747 -0.0456664   0.01616281  0.01747262]\n",
      "2= tensor([[-0.0781, -0.1011]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0337708  -0.24101637  0.01651226  0.31521097]\n",
      "2= tensor([[0.0517, 0.2151]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03859112 -0.04613348  0.02281648  0.02778086]\n",
      "2= tensor([[-0.0736, -0.0880]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03951379 -0.24157508  0.0233721   0.3275744 ]\n",
      "2= tensor([[0.0551, 0.2226]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0443453  -0.04679353  0.02992359  0.04235266]\n",
      "2= tensor([[-0.0676, -0.0705]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04528117 -0.24233152  0.03077064  0.34432456]\n",
      "2= tensor([[0.0593, 0.2318]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0501278  -0.0476605   0.03765713  0.06150141]\n",
      "2= tensor([[-0.0601, -0.0483]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05108101  0.14690186  0.03888716 -0.21906665]\n",
      "2= tensor([[-0.2033, -0.4738]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04814297 -0.04875377  0.03450583  0.08562486]\n",
      "2= tensor([[-0.0527, -0.0251]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04911805  0.145857    0.03621833 -0.19597484]\n",
      "2= tensor([[-0.1956, -0.4483]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0462009  -0.04976379  0.03229883  0.10790978]\n",
      "2= tensor([[-0.0459, -0.0041]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04719618  0.14488079  0.03445702 -0.1744106 ]\n",
      "2= tensor([[-0.1884, -0.4245]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04429857 -0.05071693  0.03096881  0.12894018]\n",
      "2= tensor([[-0.0400,  0.0136]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0453129   0.14394802  0.03354762 -0.15381385]\n",
      "2= tensor([[-0.1814, -0.4019]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04243394 -0.05163782  0.03047134  0.14926098]\n",
      "2= tensor([[-0.0335,  0.0293]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0434667   0.14303483  0.03345656 -0.13365526]\n",
      "2= tensor([[-0.1745, -0.3798]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.040606   -0.05254998  0.03078345  0.16939217]\n",
      "2= tensor([[-0.0271,  0.0449]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.041657    0.14211814  0.0341713  -0.11342276]\n",
      "2= tensor([[-0.1676, -0.3576]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03881464 -0.05347636  0.03190284  0.18984212]\n",
      "2= tensor([[-0.0205,  0.0608]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03988417  0.141175    0.03569968 -0.0926085 ]\n",
      "2= tensor([[-0.1598, -0.3339]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03706067 -0.05443997  0.03384751  0.21112047]\n",
      "2= tensor([[-0.0138,  0.0777]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03814946  0.1401821   0.03806992 -0.07069614]\n",
      "2= tensor([[-0.1514, -0.3088]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03534583 -0.05546439  0.036656    0.23375079]\n",
      "2= tensor([[-0.0075,  0.0946]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03645511  0.13911517  0.04133102 -0.04714802]\n",
      "2= tensor([[-0.1426, -0.2822]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03367281 -0.05657433  0.04038806  0.2582834 ]\n",
      "2= tensor([[-0.0005,  0.1129]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0348043   0.13794845  0.04555373 -0.02139197]\n",
      "2= tensor([[-0.1331, -0.2537]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03204533 -0.05779618  0.04512588  0.28530854]\n",
      "2= tensor([[0.0074, 0.1328]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03320125  0.13665411  0.05083206  0.00719255]\n",
      "2= tensor([[-0.1228, -0.2230]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03046817 -0.0591586   0.05097591  0.31547043]\n",
      "2= tensor([[0.0161, 0.1543]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03165134  0.13520157  0.05728532  0.03928929]\n",
      "2= tensor([[-0.1112, -0.1888]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02894731 -0.06069307  0.0580711   0.3494819 ]\n",
      "2= tensor([[0.0266, 0.1764]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03016117  0.13355696  0.06506074  0.07566133]\n",
      "2= tensor([[-0.0979, -0.1501]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02749003 -0.06243443  0.06657396  0.38814083]\n",
      "2= tensor([[0.0371, 0.1983]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02873872 -0.2584351   0.07433678  0.7010488 ]\n",
      "2= tensor([[0.1020, 0.3426]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03390742 -0.06441801  0.08835775  0.4326618 ]\n",
      "2= tensor([[0.0489, 0.2240]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03519578  0.12934907  0.09701099  0.16908842]\n",
      "2= tensor([[-0.0632, -0.0507]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0326088   0.32295823  0.10039276 -0.09148335]\n",
      "2= tensor([[-0.1959, -0.4479]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02614964  0.12655134  0.0985631   0.23110951]\n",
      "2= tensor([[-0.0439,  0.0002]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02361861  0.32013685  0.10318529 -0.02892877]\n",
      "2= tensor([[-0.1764, -0.3849]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01721587  0.51363933  0.10260671 -0.287356  ]\n",
      "2= tensor([[-0.3028, -0.7743]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00694308  0.3172152   0.09685959  0.03584407]\n",
      "2= tensor([[-0.1553, -0.3179]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00059878  0.12084731  0.09757647  0.35744748]\n",
      "2= tensor([[-0.0062,  0.0948]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00181817 0.31445643 0.10472542 0.09705722]\n",
      "2= tensor([[-0.1344, -0.2545]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00810729 0.11800155 0.10666656 0.4208581 ]\n",
      "2= tensor([[0.0116, 0.1396]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01046732 0.31146327 0.11508372 0.16361535]\n",
      "2= tensor([[-0.1116, -0.1857]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01669659 0.11489803 0.11835603 0.49027282]\n",
      "2= tensor([[0.0290, 0.1834]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01899455 0.30816892 0.12816149 0.23711015]\n",
      "2= tensor([[-0.0860, -0.1110]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.02515793 0.11147112 0.1329037  0.56731343]\n",
      "2= tensor([[0.0426, 0.2192]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02738735 0.304503   0.14424996 0.31927782]\n",
      "2= tensor([[-0.0539, -0.0393]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03347741 0.49730754 0.15063553 0.07533727]\n",
      "2= tensor([[-0.1888, -0.4083]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04342356 0.30038312 0.15214227 0.41149846]\n",
      "2= tensor([[-0.0236,  0.0310]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04943122 0.49305785 0.16037223 0.1703823 ]\n",
      "2= tensor([[-0.1567, -0.3127]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.05929238  0.6855644   0.16377988 -0.06772455]\n",
      "2= tensor([[-0.2818, -0.6824]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07300367 0.4885194  0.16242538 0.27182397]\n",
      "2= tensor([[-0.1210, -0.2115]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08277406 0.68099606 0.16786186 0.03445244]\n",
      "2= tensor([[-0.2497, -0.5845]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.09639398 0.48391443 0.16855092 0.37503964]\n",
      "2= tensor([[-0.0783, -0.1181]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.10607227 0.28684953 0.1760517  0.71576774]\n",
      "2= tensor([[0.0449, 0.1983]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.11180926 0.4791544  0.19036706 0.48326138]\n",
      "2= tensor([[-0.0357, -0.0299]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.12139235 0.6711518  0.2000323  0.25609845]\n",
      "2= tensor([[-0.1712, -0.3650]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.13481538 0.4738198  0.20515426 0.6046124 ]\n",
      "2= tensor([[0.0011, 0.0541]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04460781  0.00907355  0.02845639 -0.00937824]\n",
      "2= tensor([[-0.0985, -0.1558]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04442634 -0.1864447   0.02826882  0.29214546]\n",
      "2= tensor([[0.0360, 0.1878]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04815523  0.00826302  0.03411173  0.00851049]\n",
      "2= tensor([[-0.0916, -0.1354]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04798997 -0.18733111  0.03428194  0.31175792]\n",
      "2= tensor([[0.0414, 0.2000]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05173659  0.00728609  0.0405171   0.03008055]\n",
      "2= tensor([[-0.0835, -0.1114]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05159087 -0.18839277  0.04111871  0.3352667 ]\n",
      "2= tensor([[0.0479, 0.2144]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05535873  0.0061206   0.04782404  0.05582878]\n",
      "2= tensor([[-0.0741, -0.0831]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05523631 -0.18965329  0.04894062  0.36320877]\n",
      "2= tensor([[0.0553, 0.2299]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05902938  0.00474016  0.0562048   0.08635053]\n",
      "2= tensor([[-0.0630, -0.0499]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05893458  0.1990133   0.05793181 -0.18808351]\n",
      "2= tensor([[-0.2017, -0.4674]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05495431  0.00311243  0.05417014  0.12229726]\n",
      "2= tensor([[-0.0521, -0.0162]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05489206  0.19741812  0.05661608 -0.15281554]\n",
      "2= tensor([[-0.1905, -0.4303]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0509437   0.00153314  0.05355977  0.1571774 ]\n",
      "2= tensor([[-0.0423,  0.0134]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05091304  0.19584897  0.05670332 -0.11813934]\n",
      "2= tensor([[-0.1787, -0.3926]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-4.6996057e-02 -3.7638212e-05  5.4340530e-02  1.9188017e-01]\n",
      "2= tensor([[-0.0313,  0.0402]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04699681  0.19426653  0.05817813 -0.08317762]\n",
      "2= tensor([[-0.1663, -0.3538]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04311148 -0.00163904  0.05651458  0.22727829]\n",
      "2= tensor([[-0.0196,  0.0675]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04314426  0.19263163  0.06106015 -0.04705603]\n",
      "2= tensor([[-0.1534, -0.3144]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03929163 -0.00331032  0.06011903  0.26424968]\n",
      "2= tensor([[-0.0078,  0.0956]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03935783  0.1909043   0.06540402 -0.00888159]\n",
      "2= tensor([[-0.1395, -0.2729]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03553975  0.38503027  0.06522639 -0.28023288]\n",
      "2= tensor([[-0.2723, -0.6823]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02783914  0.18904145  0.05962173  0.03228817]\n",
      "2= tensor([[-0.1264, -0.2317]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02405831 -0.00688258  0.06026749  0.34317043]\n",
      "2= tensor([[0.0141, 0.1494]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02419597  0.1873325   0.0671309   0.07008462]\n",
      "2= tensor([[-0.1128, -0.1924]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02044932 -0.00868445  0.06853259  0.38316944]\n",
      "2= tensor([[0.0255, 0.1763]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02062301  0.18540093  0.07619599  0.1128576 ]\n",
      "2= tensor([[-0.0976, -0.1475]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01691499 -0.01072546  0.07845314  0.42857352]\n",
      "2= tensor([[0.0374, 0.2015]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0171295   0.18320286  0.08702461  0.16161737]\n",
      "2= tensor([[-0.0810, -0.0977]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01346544 -0.01305017  0.09025695  0.48043585]\n",
      "2= tensor([[0.0483, 0.2248]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01372644  0.18068951  0.09986567  0.21750876]\n",
      "2= tensor([[-0.0612, -0.0443]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01011265 -0.01570771  0.10421585  0.5399485 ]\n",
      "2= tensor([[0.0585, 0.2486]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01042681  0.1778068   0.11501482  0.28183568]\n",
      "2= tensor([[-0.0398,  0.0084]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00687067  0.37111637  0.12065153  0.02752694]\n",
      "2= tensor([[-0.1698, -0.3620]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00055166 0.17448935 0.12120207 0.35570893]\n",
      "2= tensor([[-0.0168,  0.0651]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00404144 0.36769834 0.12831625 0.10356776]\n",
      "2= tensor([[-0.1436, -0.2821]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01139541 0.1709933  0.1303876  0.4338211 ]\n",
      "2= tensor([[0.0073, 0.1236]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01481528 0.3640515  0.13906403 0.18491739]\n",
      "2= tensor([[-0.1158, -0.1980]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.02209631 0.1672421  0.14276238 0.5180347 ]\n",
      "2= tensor([[0.0269, 0.1762]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02544115 0.36009592 0.15312307 0.2735266 ]\n",
      "2= tensor([[-0.0826, -0.1089]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03264306 0.1631585  0.1585936  0.61031884]\n",
      "2= tensor([[0.0424, 0.2202]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03590624 0.35574985 0.17079997 0.37148854]\n",
      "2= tensor([[-0.0449, -0.0258]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04302123 0.5480859  0.17822975 0.13715377]\n",
      "2= tensor([[-0.1792, -0.3793]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05398295 0.3509184  0.18097283 0.4803427 ]\n",
      "2= tensor([[-0.0089,  0.0549]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06100132 0.54308623 0.19057968 0.2497144 ]\n",
      "2= tensor([[-0.1382, -0.2655]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07186305 0.34582624 0.19557397 0.59593904]\n",
      "2= tensor([[0.0204, 0.1280]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.07877957 0.5377514  0.20749274 0.3706725 ]\n",
      "2= tensor([[-0.0874, -0.1469]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02790669  0.04037313 -0.01463467  0.03743737]\n",
      "2= tensor([[-0.1027, -0.1575]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02871415 -0.15453593 -0.01388592  0.32546723]\n",
      "2= tensor([[0.0331, 0.1768]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02562343  0.04078094 -0.00737658  0.02843782]\n",
      "2= tensor([[-0.1048, -0.1660]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02643905 -0.15423445 -0.00680782  0.31878427]\n",
      "2= tensor([[0.0316, 0.1737]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02335436  0.04098379 -0.00043214  0.02396219]\n",
      "2= tensor([[-0.1052, -0.1696]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 2.4174036e-02 -1.5413196e-01  4.7107493e-05  3.1650874e-01]\n",
      "2= tensor([[0.0314, 0.1733]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0210914  0.04098932 0.00637728 0.02384067]\n",
      "2= tensor([[-0.1042, -0.1684]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02191118 -0.1542235   0.0068541   0.31852886]\n",
      "2= tensor([[0.0324, 0.1756]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01882671 0.04080016 0.01322467 0.02801532]\n",
      "2= tensor([[-0.1017, -0.1626]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01964272 -0.15450892  0.01378498  0.32484126]\n",
      "2= tensor([[0.0345, 0.1801]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01655254 0.04041407 0.0202818  0.03653722]\n",
      "2= tensor([[-0.0979, -0.1524]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01736082  0.2352394   0.02101255 -0.24967822]\n",
      "2= tensor([[-0.2425, -0.5898]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.02206561 0.03982377 0.01601898 0.04955774]\n",
      "2= tensor([[-0.0946, -0.1411]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02286208 -0.15552416  0.01701014  0.34725145]\n",
      "2= tensor([[0.0403, 0.1920]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0197516  -0.3508839   0.02395517  0.64524937]\n",
      "2= tensor([[0.1085, 0.3394]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01273392 -0.1561038   0.03686016  0.3602052 ]\n",
      "2= tensor([[0.0449, 0.2027]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00961185 0.03847533 0.04406426 0.0793692 ]\n",
      "2= tensor([[-0.0806, -0.1045]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01038135 -0.15724969  0.04565164  0.38562244]\n",
      "2= tensor([[0.0518, 0.2175]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00723636 0.03719544 0.05336409 0.10767554]\n",
      "2= tensor([[-0.0700, -0.0741]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00798027 -0.158649    0.0555176   0.41670564]\n",
      "2= tensor([[0.0600, 0.2340]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00480729 -0.354512    0.06385171  0.7263613 ]\n",
      "2= tensor([[0.1121, 0.3602]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00228295 -0.16032828  0.07837894  0.45443892]\n",
      "2= tensor([[0.0685, 0.2534]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00548952  0.03360297  0.08746772  0.18745492]\n",
      "2= tensor([[-0.0406,  0.0069]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00481746  0.2273717   0.09121682 -0.07640431]\n",
      "2= tensor([[-0.1726, -0.3846]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00027002  0.03106851  0.08968873  0.2436069 ]\n",
      "2= tensor([[-0.0230,  0.0513]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00035135  0.22480254  0.09456087 -0.01949299]\n",
      "2= tensor([[-0.1516, -0.3215]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0048474  0.02846063 0.09417101 0.3014636 ]\n",
      "2= tensor([[-0.0042,  0.0965]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00541661 0.22212304 0.10020028 0.03990249]\n",
      "2= tensor([[-0.1313, -0.2589]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00985907  0.41567603  0.10099833 -0.21956111]\n",
      "2= tensor([[-0.2614, -0.6563]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01817259 0.21926627 0.09660711 0.10319521]\n",
      "2= tensor([[-0.1112, -0.1952]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02255792  0.41288054  0.09867101 -0.15751368]\n",
      "2= tensor([[-0.2429, -0.5949]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03081553 0.2164945  0.09552074 0.16459477]\n",
      "2= tensor([[-0.0916, -0.1337]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03514542 0.02014417 0.09881263 0.48581803]\n",
      "2= tensor([[0.0421, 0.2091]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0355483  0.21374306 0.10852899 0.22583993]\n",
      "2= tensor([[-0.0702, -0.0733]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03982316 0.01725091 0.1130458  0.550689  ]\n",
      "2= tensor([[0.0538, 0.2348]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04016818 0.21061872 0.12405957 0.29565334]\n",
      "2= tensor([[-0.0453, -0.0144]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04438055 0.4037738  0.12997264 0.04452747]\n",
      "2= tensor([[-0.1763, -0.3845]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05245603 0.20705085 0.13086319 0.3752275 ]\n",
      "2= tensor([[-0.0198,  0.0463]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05659705 0.40009478 0.13836774 0.12650155]\n",
      "2= tensor([[-0.1490, -0.3007]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06459894 0.20328978 0.14089777 0.45943803]\n",
      "2= tensor([[0.0079, 0.1106]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06866474 0.39616826 0.15008654 0.21427436]\n",
      "2= tensor([[-0.1185, -0.2102]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0765881  0.19925487 0.15437202 0.5502839 ]\n",
      "2= tensor([[0.0277, 0.1661]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0805732  0.39191005 0.16537769 0.30994296]\n",
      "2= tensor([[-0.0815, -0.1161]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08841141 0.19486552 0.17157656 0.64987683]\n",
      "2= tensor([[0.0446, 0.2123]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09230871 0.38723487 0.1845741  0.4157561 ]\n",
      "2= tensor([[-0.0383, -0.0260]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.10005341 0.579327   0.19288921 0.18646929]\n",
      "2= tensor([[-0.1732, -0.3727]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.11163995 0.38204378 0.1966186  0.53326446]\n",
      "2= tensor([[-0.0016,  0.0583]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.11928082 0.1847792  0.20728388 0.8808943 ]\n",
      "2= tensor([[0.0845, 0.2830]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01983754  0.01336598  0.01580483 -0.04708039]\n",
      "2= tensor([[-0.1165, -0.2103]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01957022 -0.181979    0.01486322  0.2505469 ]\n",
      "2= tensor([[0.0215, 0.1541]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0232098   0.01292759  0.01987416 -0.03741105]\n",
      "2= tensor([[-0.1122, -0.1977]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02295125 -0.18247364  0.01912594  0.26147553]\n",
      "2= tensor([[0.0251, 0.1621]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02660072 -0.37786332  0.02435545  0.5601291 ]\n",
      "2= tensor([[0.1046, 0.3245]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03415798 -0.18309152  0.03555803  0.27521786]\n",
      "2= tensor([[0.0304, 0.1746]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03781981  0.01150554  0.04106239 -0.00604136]\n",
      "2= tensor([[-0.0975, -0.1568]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03758971 -0.18418051  0.04094156  0.29930925]\n",
      "2= tensor([[0.0374, 0.1900]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04127331 -0.3798614   0.04692775  0.6046181 ]\n",
      "2= tensor([[0.1061, 0.3376]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04887054 -0.18542606  0.05902011  0.32707784]\n",
      "2= tensor([[0.0456, 0.2091]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05257906  0.00880813  0.06556167  0.05357568]\n",
      "2= tensor([[-0.0739, -0.0877]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0524029  -0.18718964  0.06663318  0.36620203]\n",
      "2= tensor([[0.0559, 0.2312]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05614669  0.00692526  0.07395722  0.09525151]\n",
      "2= tensor([[-0.0594, -0.0429]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05600819 -0.18917449  0.07586225  0.41032067]\n",
      "2= tensor([[0.0656, 0.2519]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05979168  0.00479459  0.08406866  0.14248599]\n",
      "2= tensor([[-0.0444,  0.0034]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05969579  0.1986182   0.08691838 -0.12253556]\n",
      "2= tensor([[-0.1773, -0.3960]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05572342  0.00236547  0.08446767  0.19625409]\n",
      "2= tensor([[-0.0283,  0.0471]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05567611  0.19618401  0.08839276 -0.06863322]\n",
      "2= tensor([[-0.1580, -0.3360]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-5.1752433e-02 -8.6703294e-05  8.7020092e-02  2.5057709e-01]\n",
      "2= tensor([[-0.0108,  0.0892]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05175417  0.19369178  0.09203163 -0.01343913]\n",
      "2= tensor([[-0.1382, -0.2752]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04788033 -0.00262127  0.09176285  0.30680338]\n",
      "2= tensor([[0.0054, 0.1300]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04793276  0.19108145  0.09789892  0.04441218]\n",
      "2= tensor([[-0.1173, -0.2127]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04411113 -0.0052981   0.09878716  0.36630735]\n",
      "2= tensor([[0.0223, 0.1714]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04421709  0.18829142  0.10611331  0.10633504]\n",
      "2= tensor([[-0.0958, -0.1470]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04045126 -0.00817852  0.10824001  0.4305211 ]\n",
      "2= tensor([[0.0385, 0.2080]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04061483  0.18525757  0.11685043  0.17382549]\n",
      "2= tensor([[-0.0725, -0.0763]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03690968  0.37853014  0.12032694 -0.07983052]\n",
      "2= tensor([[-0.2024, -0.4663]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02933908  0.18190718  0.11873033  0.2482622 ]\n",
      "2= tensor([[-0.0488, -0.0136]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02570093  0.37515107  0.12369557 -0.00473814]\n",
      "2= tensor([[-0.1790, -0.3909]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01819791  0.17849222  0.12360081  0.32427007]\n",
      "2= tensor([[-0.0258,  0.0446]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01462807  0.37165737  0.13008621  0.07297897]\n",
      "2= tensor([[-0.1527, -0.3095]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00719492  0.17493366  0.1315458   0.40370885]\n",
      "2= tensor([[-0.0008,  0.1051]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00369625  0.3679686   0.13961996  0.1552211 ]\n",
      "2= tensor([[-0.1247, -0.2243]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00366312 0.17115238 0.1427244  0.4884876 ]\n",
      "2= tensor([[0.0218, 0.1631]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00708617 0.36400276 0.15249415 0.24397202]\n",
      "2= tensor([[-0.0935, -0.1322]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01436623 0.1670689  0.15737358 0.5806045 ]\n",
      "2= tensor([[0.0373, 0.2095]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0177076  0.35967633 0.16898566 0.3413407 ]\n",
      "2= tensor([[-0.0546, -0.0460]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02490113 0.55204165 0.17581248 0.10634851]\n",
      "2= tensor([[-0.1885, -0.4056]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03594196 0.35489318 0.17793946 0.44893557]\n",
      "2= tensor([[-0.0181,  0.0359]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04303983 0.15775955 0.18691817 0.7920056 ]\n",
      "2= tensor([[0.0729, 0.2780]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04619502 0.34989107 0.20275828 0.5634628 ]\n",
      "2= tensor([[0.0149, 0.1156]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03659784 -0.00668592 -0.04393609  0.00625349]\n",
      "2= tensor([[-0.1065, -0.1677]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03646412 -0.20115113 -0.04381102  0.28475675]\n",
      "2= tensor([[0.0295, 0.1647]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0324411  -0.0054326  -0.03811589 -0.02141566]\n",
      "2= tensor([[-0.1152, -0.1956]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03233245 -0.19998778 -0.0385442   0.2590018 ]\n",
      "2= tensor([[0.0230, 0.1494]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02833269 -0.00433738 -0.03336417 -0.04558503]\n",
      "2= tensor([[-0.1226, -0.2198]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02824594 -0.19896542 -0.03427587  0.23638731]\n",
      "2= tensor([[0.0169, 0.1354]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02426663 -0.00337096 -0.02954812 -0.06690718]\n",
      "2= tensor([[-0.1295, -0.2420]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02419921 -0.1980571  -0.03088626  0.21630865]\n",
      "2= tensor([[0.0114, 0.1230]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02023807 -0.00250752 -0.02656009 -0.08595492]\n",
      "2= tensor([[-0.1356, -0.2619]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02018792 -0.19723889 -0.02827919  0.19823135]\n",
      "2= tensor([[0.0064, 0.1118]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01624314 -0.00172411 -0.02431456 -0.10323653]\n",
      "2= tensor([[-0.1412, -0.2797]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01620866 -0.19648932 -0.02637929  0.18167716]\n",
      "2= tensor([[0.0018, 0.1017]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01227888 -0.00100003 -0.02274575 -0.11920937]\n",
      "2= tensor([[-0.1464, -0.2960]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01225888  0.1944403  -0.02512994 -0.41898072]\n",
      "2= tensor([[-0.2923, -0.7454]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01614768 -0.0003167  -0.03350955 -0.13432486]\n",
      "2= tensor([[-0.1535, -0.3152]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01614135 -0.19494304 -0.03619605  0.14760078]\n",
      "2= tensor([[-0.0082,  0.0757]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01224249  0.00067805 -0.03324403 -0.15627795]\n",
      "2= tensor([[-0.1608, -0.3386]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01225605 -0.19395255 -0.03636959  0.12573467]\n",
      "2= tensor([[-0.0151,  0.0596]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.008377    0.00167105 -0.0338549  -0.17819698]\n",
      "2= tensor([[-0.1681, -0.3618]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00841042 -0.19295047 -0.03741884  0.1036166 ]\n",
      "2= tensor([[-0.0218,  0.0429]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00455141  0.00268719 -0.0353465  -0.20063306]\n",
      "2= tensor([[-0.1757, -0.3857]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00460515 -0.19191186 -0.03935917  0.0806935 ]\n",
      "2= tensor([[-0.0289,  0.0255]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00076691  0.00375155 -0.0377453  -0.22414294]\n",
      "2= tensor([[-0.1837, -0.4107]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00084195 -0.19081117 -0.04222815  0.05639879]\n",
      "2= tensor([[-0.0367,  0.0042]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00297428  0.00489003 -0.04110018 -0.2493027 ]\n",
      "2= tensor([[-0.1924, -0.4376]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00287648 -0.18962161 -0.04608623  0.03013832]\n",
      "2= tensor([[-0.0459, -0.0211]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00666891  0.0061299  -0.04548347 -0.27672175]\n",
      "2= tensor([[-0.2020, -0.4671]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00654631 -0.18831463 -0.0510179   0.00127588]\n",
      "2= tensor([[-0.0564, -0.0501]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0103126   0.00750046 -0.05099238 -0.30705735]\n",
      "2= tensor([[-0.2125, -0.5011]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0101626  -0.18685919 -0.05713353 -0.03088208]\n",
      "2= tensor([[-0.0681, -0.0832]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01389978 -0.38111725 -0.05775118  0.24324144]\n",
      "2= tensor([[0.0565, 0.2065]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02152212 -0.18521999 -0.05288634 -0.06708398]\n",
      "2= tensor([[-0.0789, -0.1170]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02522652 -0.3795454  -0.05422802  0.20845523]\n",
      "2= tensor([[0.0491, 0.1915]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03281743 -0.18369165 -0.05005892 -0.10082875]\n",
      "2= tensor([[-0.0889, -0.1484]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03649126 -0.37806177 -0.05207549  0.17565002]\n",
      "2= tensor([[0.0407, 0.1750]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0440525  -0.18223472 -0.04856249 -0.13299564]\n",
      "2= tensor([[-0.0984, -0.1782]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04769719 -0.37662864 -0.05122241  0.14397971]\n",
      "2= tensor([[0.0323, 0.1584]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05522977 -0.18081194 -0.04834281 -0.16441287]\n",
      "2= tensor([[-0.1080, -0.2087]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.058846   -0.37520972 -0.05163107  0.11263589]\n",
      "2= tensor([[0.0236, 0.1404]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0663502  -0.17938744 -0.04937835 -0.19587892]\n",
      "2= tensor([[-0.1183, -0.2423]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06993795 -0.37376958 -0.05329593  0.08082756]\n",
      "2= tensor([[0.0148, 0.1217]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07741334 -0.17792574 -0.05167938 -0.22818267]\n",
      "2= tensor([[-0.1290, -0.2770]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08097185 -0.37227252 -0.05624303  0.04776133]\n",
      "2= tensor([[0.0056, 0.1020]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08841731 -0.17639108 -0.05528781 -0.26212296]\n",
      "2= tensor([[-0.1396, -0.3127]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09194513  0.0194747  -0.06053027 -0.57171905]\n",
      "2= tensor([[-0.3077, -0.7968]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09155563 -0.17474857 -0.07196464 -0.29870275]\n",
      "2= tensor([[-0.1528, -0.3545]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0950506  -0.36877486 -0.07793871 -0.02955596]\n",
      "2= tensor([[-0.0164,  0.0491]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1024261  -0.17262675 -0.07852982 -0.34577575]\n",
      "2= tensor([[-0.1708, -0.4096]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10587864 -0.36654893 -0.08544534 -0.07885301]\n",
      "2= tensor([[-0.0298,  0.0075]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11320961 -0.1703126  -0.08702239 -0.39722398]\n",
      "2= tensor([[-0.1935, -0.4748]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11661587 -0.3640991  -0.09496687 -0.1331965 ]\n",
      "2= tensor([[-0.0471, -0.0477]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12389785 -0.55774146 -0.09763081  0.12807997]\n",
      "2= tensor([[0.0598, 0.2064]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.13505268 -0.36136633 -0.09506921 -0.19373791]\n",
      "2= tensor([[-0.0689, -0.1125]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14228    -0.16502208 -0.09894396 -0.5148326 ]\n",
      "2= tensor([[-0.2476, -0.6289]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14558044 -0.3586216  -0.10924061 -0.25489575]\n",
      "2= tensor([[-0.0970, -0.1918]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.15275288 -0.552028   -0.11433853  0.00143167]\n",
      "2= tensor([[0.0279, 0.1365]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.16379344 -0.35546774 -0.1143099  -0.3250259 ]\n",
      "2= tensor([[-0.1264, -0.2787]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.17090279 -0.5487923  -0.12081042 -0.07046558]\n",
      "2= tensor([[0.0063, 0.0855]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.18187864 -0.3521641  -0.12221973 -0.39869004]\n",
      "2= tensor([[-0.1588, -0.3740]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.18892191 -0.54535943 -0.13019353 -0.14690197]\n",
      "2= tensor([[-0.0218,  0.0200]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1998291  -0.3486367  -0.13313156 -0.4776576 ]\n",
      "2= tensor([[-0.1947, -0.4782]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.20680185 -0.5416525  -0.14268471 -0.22972097]\n",
      "2= tensor([[-0.0553, -0.0677]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.21763489 -0.7344778  -0.14727914  0.01477061]\n",
      "2= tensor([[0.0578, 0.1848]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.23232445 -0.53758436 -0.14698373 -0.32051593]\n",
      "2= tensor([[-0.0923, -0.1797]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.24307613 -0.7303408  -0.15339404 -0.07755679]\n",
      "2= tensor([[0.0287, 0.1242]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.25768295 -0.5333906  -0.15494518 -0.4144344 ]\n",
      "2= tensor([[-0.1338, -0.3012]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.26835075 -0.726016   -0.16323388 -0.17432964]\n",
      "2= tensor([[-0.0105,  0.0460]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.2828711  -0.52897996 -0.16672046 -0.5137328 ]\n",
      "2= tensor([[-0.1814, -0.4371]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.29345068 -0.7214099  -0.17699511 -0.27787915]\n",
      "2= tensor([[-0.0530, -0.0562]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.30787888 -0.91362345 -0.1825527  -0.04582854]\n",
      "2= tensor([[0.0622, 0.1783]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.32615134 -0.71641713 -0.18346927 -0.3900956 ]\n",
      "2= tensor([[-0.0998, -0.1912]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.3404797  -0.9085257  -0.19127119 -0.16040689]\n",
      "2= tensor([[0.0232, 0.0991]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.3586502  -0.7112535  -0.19447932 -0.5068103 ]\n",
      "2= tensor([[-0.1559, -0.3449]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.37287527 -0.90318006 -0.20461553 -0.2811648 ]\n",
      "2= tensor([[-0.0312, -0.0159]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01047841  0.03525236 -0.02611265  0.00975346]\n",
      "2= tensor([[-0.1077, -0.1671]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00977336 -0.15948556 -0.02591758  0.29408452]\n",
      "2= tensor([[0.0269, 0.1680]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01296307  0.03599613 -0.02003589 -0.00665846]\n",
      "2= tensor([[-0.1124, -0.1836]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01224315 -0.15883283 -0.02016906  0.27963617]\n",
      "2= tensor([[0.0231, 0.1599]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0154198  -0.35366136 -0.01457633  0.5658902 ]\n",
      "2= tensor([[0.1040, 0.3207]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02249303 -0.15833798 -0.00325853  0.26865098]\n",
      "2= tensor([[0.0211, 0.1564]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02565979  0.03683033  0.00211449 -0.02505794]\n",
      "2= tensor([[-0.1150, -0.1976]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02492318 -0.15832189  0.00161333  0.26829138]\n",
      "2= tensor([[0.0213, 0.1570]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02808962  0.036777    0.00697916 -0.02388225]\n",
      "2= tensor([[-0.1138, -0.1951]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02735408 -0.15844433  0.00650151  0.27099448]\n",
      "2= tensor([[0.0224, 0.1597]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03052297  0.03658424  0.0119214  -0.01963076]\n",
      "2= tensor([[-0.1115, -0.1893]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02979128 -0.15870664  0.01152879  0.27678955]\n",
      "2= tensor([[0.0244, 0.1642]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03296542  0.03624896  0.01706458 -0.01223503]\n",
      "2= tensor([[-0.1082, -0.1803]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03224044 -0.15911351  0.01681988  0.28578275]\n",
      "2= tensor([[0.0274, 0.1709]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03542271 -0.35447124  0.02253553  0.5837227 ]\n",
      "2= tensor([[0.1035, 0.3277]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04251213 -0.15967213  0.03420999  0.29822314]\n",
      "2= tensor([[0.0323, 0.1822]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04570558  0.03494589  0.04017445  0.01652268]\n",
      "2= tensor([[-0.0949, -0.1442]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04500666 -0.1607285   0.0405049   0.32160553]\n",
      "2= tensor([[0.0386, 0.1963]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04822123  0.03379394  0.04693701  0.04196639]\n",
      "2= tensor([[-0.0856, -0.1166]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04754535 -0.16196856  0.04777634  0.34908116]\n",
      "2= tensor([[0.0460, 0.2128]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05078472  0.03244249  0.05475796  0.07183824]\n",
      "2= tensor([[-0.0748, -0.0843]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05013587 -0.16341999  0.05619473  0.38128242]\n",
      "2= tensor([[0.0544, 0.2304]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05340427  0.03086086  0.06382038  0.1068337 ]\n",
      "2= tensor([[-0.0625, -0.0468]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05278705  0.22501294  0.06595705 -0.16505107]\n",
      "2= tensor([[-0.1998, -0.4605]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04828679  0.02901186  0.06265603  0.1476886 ]\n",
      "2= tensor([[-0.0506, -0.0096]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04770656  0.22318321  0.06560981 -0.12458809]\n",
      "2= tensor([[-0.1868, -0.4181]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04324289  0.02718566  0.06311804  0.18805113]\n",
      "2= tensor([[-0.0386,  0.0227]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04269918  0.22135046  0.06687906 -0.08407172]\n",
      "2= tensor([[-0.1728, -0.3740]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03827217  0.02533673  0.06519763  0.22893935]\n",
      "2= tensor([[-0.0253,  0.0543]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03776544  0.21946934  0.06977642 -0.04248635]\n",
      "2= tensor([[-0.1580, -0.3290]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03337605  0.02341979  0.06892669  0.27137   ]\n",
      "2= tensor([[-0.0112,  0.0871]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03290765  0.21749395  0.07435409  0.00119841]\n",
      "2= tensor([[-0.1421, -0.2816]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02855777  0.41147515  0.07437806 -0.26712948]\n",
      "2= tensor([[-0.2734, -0.6867]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02032827  0.21537484  0.06903547  0.04805472]\n",
      "2= tensor([[-0.1270, -0.2349]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01602077  0.01933438  0.06999657  0.36169526]\n",
      "2= tensor([[0.0139, 0.1490]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01563409  0.21339522  0.07723047  0.09187901]\n",
      "2= tensor([[-0.1118, -0.1893]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01136618  0.01725614  0.07906805  0.40789387]\n",
      "2= tensor([[0.0263, 0.1794]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01102106  0.21117316  0.08722593  0.14114888]\n",
      "2= tensor([[-0.0947, -0.1378]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00679759  0.01491727  0.0900489   0.46002546]\n",
      "2= tensor([[0.0389, 0.2070]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00649925  0.20865868  0.09924942  0.19702941]\n",
      "2= tensor([[-0.0757, -0.0811]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00232608  0.01226752  0.10319     0.5192979 ]\n",
      "2= tensor([[0.0498, 0.2314]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00208073  0.20579691  0.11357596  0.26083204]\n",
      "2= tensor([[-0.0525, -0.0256]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00203521 0.3991298  0.1187926  0.00602069]\n",
      "2= tensor([[-0.1847, -0.4061]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01001781 0.20252225 0.11891301 0.33369657]\n",
      "2= tensor([[-0.0308,  0.0292]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01406825 0.39576873 0.12558694 0.08075196]\n",
      "2= tensor([[-0.1594, -0.3281]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.02198363 0.19909114 0.12720199 0.41027048]\n",
      "2= tensor([[-0.0054,  0.0881]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02596545 0.39220187 0.13540739 0.16024126]\n",
      "2= tensor([[-0.1328, -0.2469]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03380949 0.19542739 0.13861221 0.49238944]\n",
      "2= tensor([[0.0182, 0.1464]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03771804 0.38835    0.14846    0.24640271]\n",
      "2= tensor([[-0.1025, -0.1580]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04548503 0.19145404 0.15338807 0.581985  ]\n",
      "2= tensor([[0.0337, 0.1929]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04931412 0.3841319  0.16502777 0.34128097]\n",
      "2= tensor([[-0.0645, -0.0721]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05699676 0.5765685  0.17185338 0.10484601]\n",
      "2= tensor([[-0.1991, -0.4367]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.06852812  0.7688644   0.1739503  -0.1290724 ]\n",
      "2= tensor([[-0.3217, -0.7999]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08390541 0.5717327  0.17136885 0.21304664]\n",
      "2= tensor([[-0.1624, -0.3324]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.09534007 0.37462786 0.17562978 0.5545094 ]\n",
      "2= tensor([[0.0052, 0.0824]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.10283262 0.5669054  0.18671997 0.3219    ]\n",
      "2= tensor([[-0.1195, -0.2223]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.11417073 0.36968347 0.19315797 0.6671681 ]\n",
      "2= tensor([[0.0287, 0.1403]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.1215644  0.56166935 0.20650133 0.44098076]\n",
      "2= tensor([[-0.0682, -0.1128]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02335742  0.00177691  0.021033   -0.02293805]\n",
      "2= tensor([[-0.1100, -0.1963]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02339296 -0.19364026  0.02057424  0.27630612]\n",
      "2= tensor([[0.0290, 0.1641]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01952015  0.00118221  0.02610036 -0.00981734]\n",
      "2= tensor([[-0.1042, -0.1796]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0195438  -0.19430414  0.02590401  0.29098496]\n",
      "2= tensor([[0.0337, 0.1747]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01565771 0.00043905 0.03172371 0.00658309]\n",
      "2= tensor([[-0.0972, -0.1592]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01566649 -0.19512315  0.03185537  0.30910403]\n",
      "2= tensor([[0.0389, 0.1864]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01176403 -0.00046923  0.03803745  0.02663516]\n",
      "2= tensor([[-0.0890, -0.1353]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01175465  0.19408718  0.03857015 -0.25380805]\n",
      "2= tensor([[-0.2326, -0.5674]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01563639 -0.00156367  0.033494    0.05078677]\n",
      "2= tensor([[-0.0820, -0.1119]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01560512 -0.19714949  0.03450973  0.35384634]\n",
      "2= tensor([[0.0506, 0.2117]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01166213 -0.0025348   0.04158666  0.07224196]\n",
      "2= tensor([[-0.0740, -0.0879]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01161143 -0.19822751  0.0430315   0.3777502 ]\n",
      "2= tensor([[0.0572, 0.2252]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00764688 -0.00374228  0.0505865   0.09893976]\n",
      "2= tensor([[-0.0642, -0.0584]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00757204  0.19061954  0.0525653  -0.17736393]\n",
      "2= tensor([[-0.2043, -0.4793]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01138443 -0.00521371  0.04901802  0.13142729]\n",
      "2= tensor([[-0.0543, -0.0277]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01128015  0.18917306  0.05164656 -0.1453971 ]\n",
      "2= tensor([[-0.1935, -0.4445]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01506361 -0.00664902  0.04873862  0.16312169]\n",
      "2= tensor([[-0.0445,  0.0003]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01493063 -0.20243359  0.05200106  0.47077328]\n",
      "2= tensor([[0.0767, 0.2654]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01088196 -0.00808324  0.06141652  0.19492325]\n",
      "2= tensor([[-0.0331,  0.0279]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0107203   0.18610887  0.06531499 -0.07777061]\n",
      "2= tensor([[-0.1675, -0.3664]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01444247 -0.00988566  0.06375957  0.23478326]\n",
      "2= tensor([[-0.0199,  0.0589]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01424476  0.18427011  0.06845524 -0.03712601]\n",
      "2= tensor([[-0.1521, -0.3207]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01793016 -0.01176331  0.06771272  0.27634555]\n",
      "2= tensor([[-0.0061,  0.0915]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0176949  0.18233053 0.07323963 0.00576431]\n",
      "2= tensor([[-0.1366, -0.2747]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02134151 -0.0137612   0.07335491  0.3206266 ]\n",
      "2= tensor([[0.0079, 0.1245]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02106628 0.1802436  0.07976744 0.05194898]\n",
      "2= tensor([[-0.1202, -0.2261]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02467115 -0.01592614  0.08080643  0.3686947 ]\n",
      "2= tensor([[0.0213, 0.1586]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02435263 0.17796025 0.08818032 0.10254537]\n",
      "2= tensor([[-0.1025, -0.1725]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02791184  0.37171504  0.09023122 -0.1610662 ]\n",
      "2= tensor([[-0.2367, -0.5779]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03534614  0.56543714  0.08700991 -0.42397523]\n",
      "2= tensor([[-0.3659, -0.9760]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04665488  0.3691973   0.0785304  -0.10518039]\n",
      "2= tensor([[-0.2219, -0.5263]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05403883 0.17304292 0.07642679 0.2112086 ]\n",
      "2= tensor([[-0.0700, -0.0715]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.05749968 -0.02308385  0.08065096  0.5269876 ]\n",
      "2= tensor([[0.0555, 0.2316]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05703801 0.1708162  0.09119072 0.26076862]\n",
      "2= tensor([[-0.0510, -0.0282]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06045433  0.3645261   0.09640609 -0.00181597]\n",
      "2= tensor([[-0.1858, -0.4149]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06774485 0.16816321 0.09636977 0.31966016]\n",
      "2= tensor([[-0.0327,  0.0162]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.07110812 0.36179003 0.10276297 0.05885642]\n",
      "2= tensor([[-0.1654, -0.3531]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07834392 0.16535626 0.1039401  0.38211182]\n",
      "2= tensor([[-0.0128,  0.0636]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08165105 0.35886064 0.11158234 0.12392514]\n",
      "2= tensor([[-0.1435, -0.2867]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08882826 0.16233166 0.11406084 0.4496225 ]\n",
      "2= tensor([[0.0097, 0.1151]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09207489 0.35567114 0.12305329 0.19495894]\n",
      "2= tensor([[-0.1188, -0.2136]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.09918831  0.5488377   0.12695247 -0.05651351]\n",
      "2= tensor([[-0.2525, -0.6068]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.11016507 0.35214567 0.1258222  0.27337402]\n",
      "2= tensor([[-0.0905, -0.1388]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.11720798 0.5452688  0.13128968 0.02287361]\n",
      "2= tensor([[-0.2283, -0.5295]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.12811336 0.34853226 0.13174716 0.35392702]\n",
      "2= tensor([[-0.0602, -0.0716]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.135084   0.15180711 0.13882568 0.6850792 ]\n",
      "2= tensor([[0.0537, 0.2311]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.13812014 0.3447566  0.15252727 0.43912324]\n",
      "2= tensor([[-0.0267, -0.0012]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.14501527 0.53742796 0.16130973 0.1981408 ]\n",
      "2= tensor([[-0.1654, -0.3513]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.15576383 0.34041056 0.16527256 0.53705   ]\n",
      "2= tensor([[0.0032, 0.0681]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.16257204 0.5328703  0.17601356 0.3006634 ]\n",
      "2= tensor([[-0.1256, -0.2464]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.17322946 0.33573362 0.18202682 0.64328086]\n",
      "2= tensor([[0.0285, 0.1288]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.17994413 0.5279146  0.19489244 0.41299286]\n",
      "2= tensor([[-0.0774, -0.1401]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.19050242 0.33064145 0.2031523  0.7602369 ]\n",
      "2= tensor([[0.0503, 0.1767]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03332512 -0.03958372  0.00882343  0.03130137]\n",
      "2= tensor([[-0.0845, -0.1179]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03253344 -0.23483108  0.00944945  0.32675508]\n",
      "2= tensor([[0.0494, 0.2039]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02783682 -0.03984493  0.01598456  0.037067  ]\n",
      "2= tensor([[-0.0811, -0.1089]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02703992 -0.23519242  0.0167259   0.33475006]\n",
      "2= tensor([[0.0520, 0.2100]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02233608 -0.04031245  0.0234209   0.04738818]\n",
      "2= tensor([[-0.0760, -0.0949]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02152983 -0.23576227  0.02436866  0.3473676 ]\n",
      "2= tensor([[0.0556, 0.2181]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01681458 -0.04099526  0.03131601  0.06246752]\n",
      "2= tensor([[-0.0699, -0.0770]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01599468 -0.23655188  0.03256536  0.36486402]\n",
      "2= tensor([[0.0605, 0.2286]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01126364 -0.04190751  0.03986264  0.0826248 ]\n",
      "2= tensor([[-0.0620, -0.0538]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01042549  0.15262102  0.04151514 -0.19721967]\n",
      "2= tensor([[-0.2035, -0.4788]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01347791 -0.0430694   0.03757074  0.10826498]\n",
      "2= tensor([[-0.0541, -0.0291]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01261652  0.15149458  0.03973605 -0.17233184]\n",
      "2= tensor([[-0.1952, -0.4514]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01564641 -0.04417289  0.03628941  0.13261701]\n",
      "2= tensor([[-0.0466, -0.0065]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01476296  0.15041095  0.03894175 -0.14839984]\n",
      "2= tensor([[-0.1870, -0.4251]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01777118 -0.04524639  0.03597375  0.15630963]\n",
      "2= tensor([[-0.0394,  0.0126]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01686625  0.14934254  0.03909995 -0.12481089]\n",
      "2= tensor([[-0.1790, -0.3991]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0198531  -0.04631712  0.03660373  0.17994674]\n",
      "2= tensor([[-0.0316,  0.0310]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01892675  0.14826243  0.04020266 -0.100968  ]\n",
      "2= tensor([[-0.1704, -0.3724]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.021892   -0.04741193  0.0381833   0.20412278]\n",
      "2= tensor([[-0.0235,  0.0498]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02094376  0.14714375  0.04226576 -0.07627486]\n",
      "2= tensor([[-0.1611, -0.3442]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02388664 -0.04855783  0.04074026  0.22943777]\n",
      "2= tensor([[-0.0150,  0.0697]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02291548  0.14595897  0.04532902 -0.050121  ]\n",
      "2= tensor([[-0.1513, -0.3152]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02583466 -0.04978265  0.0443266   0.25651202]\n",
      "2= tensor([[-0.0058,  0.0909]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02483901  0.14467934  0.04945683 -0.02186669]\n",
      "2= tensor([[-0.1406, -0.2841]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0277326  -0.05111571  0.0490195   0.28600115]\n",
      "2= tensor([[0.0041, 0.1134]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02671028 0.14327411 0.05473953 0.00917263]\n",
      "2= tensor([[-0.1289, -0.2499]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02957577 -0.05258841  0.05492298  0.31861174]\n",
      "2= tensor([[0.0136, 0.1371]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.028524   0.14171004 0.06129521 0.04374278]\n",
      "2= tensor([[-0.1163, -0.2133]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0313582  -0.05423485  0.06217007  0.35511768]\n",
      "2= tensor([[0.0242, 0.1634]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0302735  0.13995057 0.06927242 0.08266848]\n",
      "2= tensor([[-0.1022, -0.1719]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03307251 -0.05609248  0.07092579  0.3963776 ]\n",
      "2= tensor([[0.0358, 0.1874]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03195066 0.13795526 0.07885335 0.12687251]\n",
      "2= tensor([[-0.0863, -0.1254]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03470977 -0.05820259  0.08139079  0.44335386]\n",
      "2= tensor([[0.0479, 0.2129]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03354572 0.13567907 0.09025787 0.17739658]\n",
      "2= tensor([[-0.0689, -0.0731]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0362593  -0.06061084  0.0938058   0.49713275]\n",
      "2= tensor([[0.0582, 0.2353]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03504708 0.13307193 0.10374846 0.2354244 ]\n",
      "2= tensor([[-0.0476, -0.0198]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03770852  0.32657036  0.10845695 -0.02281525]\n",
      "2= tensor([[-0.1804, -0.4049]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04423993 0.13007368 0.10800064 0.30202183]\n",
      "2= tensor([[-0.0278,  0.0309]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0468414  0.3235039  0.11404108 0.04525749]\n",
      "2= tensor([[-0.1573, -0.3338]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05331148 0.12694705 0.11494622 0.37163308]\n",
      "2= tensor([[-0.0057,  0.0847]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05585042 0.32026437 0.12237889 0.1172905 ]\n",
      "2= tensor([[-0.1328, -0.2592]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06225571 0.12362085 0.1247247  0.4459394 ]\n",
      "2= tensor([[0.0171, 0.1399]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06472813 0.31677797 0.1336435  0.19502845]\n",
      "2= tensor([[-0.1062, -0.1784]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07106368 0.12002266 0.13754405 0.526704  ]\n",
      "2= tensor([[0.0346, 0.1875]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.07346413 0.31296852 0.14807814 0.28032917]\n",
      "2= tensor([[-0.0739, -0.0939]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07972351 0.11607871 0.15368472 0.6158079 ]\n",
      "2= tensor([[0.0493, 0.2277]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08204508 0.3087574  0.16600087 0.37520197]\n",
      "2= tensor([[-0.0378, -0.0139]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08822023 0.5011804  0.17350492 0.13911562]\n",
      "2= tensor([[-0.1722, -0.3678]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.09824383 0.30405292 0.17628723 0.48112217]\n",
      "2= tensor([[-0.0032,  0.0649]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.10432489 0.49630564 0.18590967 0.24877289]\n",
      "2= tensor([[-0.1317, -0.2543]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.11425101 0.2990827  0.19088513 0.59385276]\n",
      "2= tensor([[0.0256, 0.1361]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.12023266 0.49109265 0.20276219 0.3668492 ]\n",
      "2= tensor([[-0.0819, -0.1382]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04503054 -0.00145921  0.04811621 -0.04149099]\n",
      "2= tensor([[-0.1157, -0.2249]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04500136 -0.19723694  0.04728639  0.26597643]\n",
      "2= tensor([[0.0265, 0.1551]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04105662 -0.00282065  0.05260592 -0.01142501]\n",
      "2= tensor([[-0.1038, -0.1890]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04100021  0.19150893  0.05237743 -0.28705713]\n",
      "2= tensor([[-0.2454, -0.6152]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04483038 -0.00431933  0.04663628  0.02167435]\n",
      "2= tensor([[-0.0928, -0.1531]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.044744   -0.200078    0.04706977  0.32869917]\n",
      "2= tensor([[0.0441, 0.1929]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04074244 -0.00565663  0.05364375  0.05122354]\n",
      "2= tensor([[-0.0812, -0.1185]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0406293  -0.2015051   0.05466822  0.36033735]\n",
      "2= tensor([[0.0530, 0.2121]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0365992  -0.00720113  0.06187497  0.08538128]\n",
      "2= tensor([[-0.0691, -0.0813]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03645518 -0.20315294  0.0635826   0.39692616]\n",
      "2= tensor([[0.0628, 0.2323]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03239212 -0.00898799  0.07152112  0.12494794]\n",
      "2= tensor([[-0.0549, -0.0390]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03221236  0.18504032  0.07402008 -0.14434119]\n",
      "2= tensor([[-0.1928, -0.4502]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03591317 -0.01105933  0.07113326  0.17074488]\n",
      "2= tensor([[-0.0408,  0.0026]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03569198  0.1829762   0.07454816 -0.09867683]\n",
      "2= tensor([[-0.1760, -0.3987]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0393515  -0.01313061  0.07257462  0.21656325]\n",
      "2= tensor([[-0.0265,  0.0383]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03908889  0.18088284  0.07690588 -0.05237264]\n",
      "2= tensor([[-0.1588, -0.3471]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04270655 -0.01525279  0.07585843  0.26354924]\n",
      "2= tensor([[-0.0108,  0.0753]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0424015   0.17870903  0.08112941 -0.00427578]\n",
      "2= tensor([[-0.1410, -0.2942]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04597567 -0.01747705  0.0810439   0.3128613 ]\n",
      "2= tensor([[0.0059, 0.1138]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04562613 0.17640245 0.08730112 0.04679743]\n",
      "2= tensor([[-0.1227, -0.2395]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04915418 -0.01985582  0.08823707  0.36569765]\n",
      "2= tensor([[0.0207, 0.1514]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04875707 0.17390864 0.09555102 0.10208973]\n",
      "2= tensor([[-0.1034, -0.1807]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.05223524 -0.02244359  0.09759282  0.42332384]\n",
      "2= tensor([[0.0356, 0.1881]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05178637 -0.21880284  0.1060593   0.74510795]\n",
      "2= tensor([[0.1028, 0.3414]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04741031 -0.0252919   0.12096146  0.48759556]\n",
      "2= tensor([[0.0497, 0.2214]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04690447 0.16793428 0.13071337 0.23535012]\n",
      "2= tensor([[-0.0548, -0.0423]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05026316  0.36097     0.13542037 -0.0134129 ]\n",
      "2= tensor([[-0.1845, -0.4215]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05748256 0.16419202 0.13515212 0.3187437 ]\n",
      "2= tensor([[-0.0289,  0.0227]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0607664  0.35715622 0.14152698 0.07155076]\n",
      "2= tensor([[-0.1559, -0.3331]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06790952 0.16031884 0.142958   0.40532497]\n",
      "2= tensor([[-0.0010,  0.0895]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0711159  0.3531548  0.1510645  0.16090837]\n",
      "2= tensor([[-0.1256, -0.2402]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07817899 0.15622932 0.15428267 0.4971768 ]\n",
      "2= tensor([[0.0244, 0.1538]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08130358 0.34887776 0.1642262  0.25681594]\n",
      "2= tensor([[-0.0911, -0.1402]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08828114 0.15183856 0.16936252 0.5964638 ]\n",
      "2= tensor([[0.0412, 0.2052]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09131791 0.3442363  0.1812918  0.36155114]\n",
      "2= tensor([[-0.0488, -0.0461]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09820264 0.5363808  0.18852282 0.13106608]\n",
      "2= tensor([[-0.1835, -0.4039]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.10893025 0.33912885 0.19114414 0.47679973]\n",
      "2= tensor([[-0.0097,  0.0410]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.11571283 0.53111094 0.20068014 0.24992612]\n",
      "2= tensor([[-0.1388, -0.2804]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.12633505 0.33377346 0.20567866 0.5985966 ]\n",
      "2= tensor([[0.0222, 0.1202]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03743118  0.03766831 -0.0172803   0.01933336]\n",
      "2= tensor([[-0.1014, -0.1479]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03667781 -0.15720162 -0.01689364  0.30651444]\n",
      "2= tensor([[0.0319, 0.1820]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03982184  0.03815694 -0.01076335  0.00855193]\n",
      "2= tensor([[-0.1042, -0.1579]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0390587  -0.15680902 -0.01059231  0.29781955]\n",
      "2= tensor([[0.0298, 0.1775]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04219488  0.03846232 -0.00463592  0.00181491]\n",
      "2= tensor([[-0.1056, -0.1638]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04142564 -0.15659285 -0.00459962  0.29303154]\n",
      "2= tensor([[0.0288, 0.1754]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04455749  0.03859439  0.00126101 -0.00109848]\n",
      "2= tensor([[-0.1057, -0.1657]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04378561 -0.15654562  0.00123904  0.29198205]\n",
      "2= tensor([[0.0288, 0.1757]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04691652  0.03855864  0.00707868 -0.00030985]\n",
      "2= tensor([[-0.1046, -0.1638]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04614535 -0.15666412  0.00707249  0.29459804]\n",
      "2= tensor([[0.0299, 0.1783]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04927863  0.0383563   0.01296445  0.00415405]\n",
      "2= tensor([[-0.1022, -0.1581]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04851151 -0.15694916  0.01304753  0.30089906]\n",
      "2= tensor([[0.0321, 0.1832]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05165049  0.03798442  0.01906551  0.01235945]\n",
      "2= tensor([[-0.0987, -0.1485]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0508908  -0.1574057   0.0193127   0.31099626]\n",
      "2= tensor([[0.0350, 0.1898]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05403891  0.03743586  0.02553262  0.02446602]\n",
      "2= tensor([[-0.0938, -0.1348]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0532902   0.23218252  0.02602194 -0.26005298]\n",
      "2= tensor([[-0.2356, -0.5662]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04864654  0.03669894  0.02082088  0.0407227 ]\n",
      "2= tensor([[-0.0895, -0.1201]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04791257 -0.1587153   0.02163534  0.33990142]\n",
      "2= tensor([[0.0424, 0.2055]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05108687  0.03609224  0.02843337  0.0541188 ]\n",
      "2= tensor([[-0.0840, -0.1050]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05036503 -0.15942563  0.02951574  0.35563534]\n",
      "2= tensor([[0.0466, 0.2150]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05355354  0.03526451  0.03662845  0.0724037 ]\n",
      "2= tensor([[-0.0769, -0.0848]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05284825 -0.1603629   0.03807652  0.37641433]\n",
      "2= tensor([[0.0521, 0.2265]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05605551  0.03419814  0.04560481  0.09597611]\n",
      "2= tensor([[-0.0682, -0.0591]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05537155  0.2286378   0.04752433 -0.18197697]\n",
      "2= tensor([[-0.2075, -0.4797]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05079879  0.03286917  0.04388479  0.12531132]\n",
      "2= tensor([[-0.0595, -0.0320]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05014141  0.22733584  0.04639102 -0.15320987]\n",
      "2= tensor([[-0.1987, -0.4508]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04559469  0.0315814   0.04332682  0.15373996]\n",
      "2= tensor([[-0.0513, -0.0071]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04496306  0.22605705  0.04640162 -0.12496567]\n",
      "2= tensor([[-0.1893, -0.4208]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04044192  0.03030212  0.04390231  0.18198787]\n",
      "2= tensor([[-0.0427,  0.0145]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03983588  0.22476926  0.04754207 -0.09652865]\n",
      "2= tensor([[-0.1798, -0.3907]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03534049  0.0289993   0.04561149  0.21076658]\n",
      "2= tensor([[-0.0334,  0.0362]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0347605   0.22344042  0.04982682 -0.06718662]\n",
      "2= tensor([[-0.1698, -0.3597]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0302917   0.4178139   0.04848309 -0.34374198]\n",
      "2= tensor([[-0.3017, -0.7713]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02193542  0.22203696  0.04160825 -0.03617318]\n",
      "2= tensor([[-0.1604, -0.3295]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01749468  0.0263438   0.04088479  0.2693418 ]\n",
      "2= tensor([[-0.0156,  0.0773]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0169678   0.22085917  0.04627162 -0.01017066]\n",
      "2= tensor([[-0.1509, -0.3021]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01255062  0.02510522  0.04606821  0.296745  ]\n",
      "2= tensor([[-0.0064,  0.0978]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01204852  0.2195412   0.05200311  0.01893971]\n",
      "2= tensor([[-0.1402, -0.2714]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00765769  0.02371353  0.0523819   0.32756615]\n",
      "2= tensor([[0.0032, 0.1199]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00718342  0.21805212  0.05893323  0.05185134]\n",
      "2= tensor([[-0.1285, -0.2378]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00282238  0.02213682  0.05997025  0.36253044]\n",
      "2= tensor([[0.0129, 0.1441]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00237964  0.21635741  0.06722086  0.08934397]\n",
      "2= tensor([[-0.1155, -0.1991]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00194751 0.02033954 0.06900774 0.40245476]\n",
      "2= tensor([[0.0238, 0.1712]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0023543  0.21441834 0.07705684 0.13230164]\n",
      "2= tensor([[-0.1004, -0.1544]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00664266 0.01828201 0.07970287 0.4482654 ]\n",
      "2= tensor([[0.0356, 0.1974]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0070083  0.2121914  0.08866818 0.18173252]\n",
      "2= tensor([[-0.0836, -0.1045]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01125213 0.01591995 0.09230283 0.50101745]\n",
      "2= tensor([[0.0459, 0.2203]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01157053 0.2096278  0.10232317 0.23879106]\n",
      "2= tensor([[-0.0629, -0.0515]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01576309  0.40315044  0.107099   -0.01994404]\n",
      "2= tensor([[-0.1966, -0.4421]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0238261  0.20666859 0.10670011 0.30451706]\n",
      "2= tensor([[-0.0420, -0.0007]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02795947 0.40012097 0.11279046 0.04729908]\n",
      "2= tensor([[-0.1741, -0.3722]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03596189 0.20357755 0.11373644 0.37333107]\n",
      "2= tensor([[-0.0203,  0.0511]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04003344 0.3969156  0.12120306 0.11856419]\n",
      "2= tensor([[-0.1503, -0.2996]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04797175 0.20028438 0.12357435 0.44689378]\n",
      "2= tensor([[0.0042, 0.1073]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05197744 0.39346135 0.13251223 0.19557643]\n",
      "2= tensor([[-0.1239, -0.2209]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05984667 0.19671738 0.13642375 0.5269498 ]\n",
      "2= tensor([[0.0238, 0.1589]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06378102 0.38968268 0.14696275 0.28017548]\n",
      "2= tensor([[-0.0923, -0.1366]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07157467 0.19280341 0.15256625 0.61536264]\n",
      "2= tensor([[0.0386, 0.2013]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.07543074 0.38550162 0.16487351 0.3743535 ]\n",
      "2= tensor([[-0.0541, -0.0543]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08314077 0.18846858 0.17236058 0.71414864]\n",
      "2= tensor([[0.0552, 0.2420]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08691014 0.38083857 0.18664356 0.48029274]\n",
      "2= tensor([[-0.0159,  0.0287]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09452691 0.5729034  0.19624941 0.25175422]\n",
      "2= tensor([[-0.1466, -0.2964]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.10598498 0.3755996  0.20128448 0.59935665]\n",
      "2= tensor([[0.0161, 0.1071]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0034902  0.0098908  0.02138443 0.00563003]\n",
      "2= tensor([[-0.0994, -0.1606]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00368801 -0.1855312   0.02149703  0.30498257]\n",
      "2= tensor([[0.0363, 0.1832]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-2.2609527e-05  9.2779128e-03  2.7596684e-02  1.9156050e-02]\n",
      "2= tensor([[-0.0937, -0.1444]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 1.6294872e-04 -1.8622871e-01  2.7979806e-02  3.2041672e-01]\n",
      "2= tensor([[0.0407, 0.1931]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00356163  0.00848383  0.03438814  0.03668722]\n",
      "2= tensor([[-0.0869, -0.1246]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00339195 -0.18711394  0.03512188  0.34001854]\n",
      "2= tensor([[0.0461, 0.2053]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00713423  0.00749112  0.04192226  0.05861467]\n",
      "2= tensor([[-0.0787, -0.1002]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00698441 -0.18820606  0.04309455  0.36422408]\n",
      "2= tensor([[0.0527, 0.2196]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01074853  0.00627778  0.05037903  0.08543503]\n",
      "2= tensor([[-0.0689, -0.0708]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01062297 -0.18952876  0.05208773  0.39357737]\n",
      "2= tensor([[0.0606, 0.2356]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01441355  0.00481684  0.05995928  0.1177612 ]\n",
      "2= tensor([[-0.0573, -0.0363]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01431721 -0.19111067  0.0623145   0.4287418 ]\n",
      "2= tensor([[0.0683, 0.2520]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01813942  0.00307598  0.07088934  0.15633579]\n",
      "2= tensor([[-0.0447,  0.0016]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0180779   0.19711514  0.07401606 -0.11316791]\n",
      "2= tensor([[-0.1793, -0.4018]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0141356   0.00101495  0.0717527   0.20191787]\n",
      "2= tensor([[-0.0302,  0.0376]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0141153   0.19504127  0.07579105 -0.06729554]\n",
      "2= tensor([[-0.1622, -0.3496]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01021448 -0.00108086  0.07444514  0.24830437]\n",
      "2= tensor([[-0.0149,  0.0739]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01023609  0.19290332  0.07941123 -0.01999932]\n",
      "2= tensor([[-0.1447, -0.2972]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00637803 -0.00326235  0.07901124  0.29664427]\n",
      "2= tensor([[0.0006, 0.1109]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00644327  0.19064955  0.08494413  0.029889  ]\n",
      "2= tensor([[-0.1271, -0.2447]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00263028 -0.00558134  0.08554191  0.3481176 ]\n",
      "2= tensor([[0.0149, 0.1475]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00274191  0.18822637  0.09250426  0.08358767]\n",
      "2= tensor([[-0.1083, -0.1879]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00102262 -0.00809147  0.09417602  0.40396288]\n",
      "2= tensor([[0.0297, 0.1841]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00086079 0.1855775  0.10225527 0.14239359]\n",
      "2= tensor([[-0.0878, -0.1255]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00457234 -0.01084897  0.10510314  0.4655049 ]\n",
      "2= tensor([[0.0444, 0.2159]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00435536 0.18264309 0.11441324 0.2077119 ]\n",
      "2= tensor([[-0.0656, -0.0595]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00800822  0.37595892  0.11856748 -0.04680181]\n",
      "2= tensor([[-0.1969, -0.4502]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0155274  0.17935397 0.11763144 0.28081232]\n",
      "2= tensor([[-0.0419, -0.0017]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01911448 0.37261868 0.12324769 0.02742254]\n",
      "2= tensor([[-0.1721, -0.3727]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.02656685 0.17596458 0.12379614 0.3563093 ]\n",
      "2= tensor([[-0.0189,  0.0557]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03008614 0.36912897 0.13092233 0.10508329]\n",
      "2= tensor([[-0.1457, -0.2921]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03746872 0.17239754 0.13302399 0.4360363 ]\n",
      "2= tensor([[0.0070, 0.1168]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04091667 0.36541033 0.14174472 0.18806873]\n",
      "2= tensor([[-0.1174, -0.2064]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04822488 0.16857497 0.1455061  0.5218942 ]\n",
      "2= tensor([[0.0271, 0.1709]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05159638 0.3613814  0.15594397 0.2783687 ]\n",
      "2= tensor([[-0.0834, -0.1153]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05882401 0.16441847 0.16151135 0.61588997]\n",
      "2= tensor([[0.0427, 0.2163]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06211238 0.35695937 0.17382915 0.37811553]\n",
      "2= tensor([[-0.0442, -0.0297]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06925157 0.54924154 0.18139146 0.14488769]\n",
      "2= tensor([[-0.1794, -0.3842]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0802364  0.35204813 0.18428922 0.4888621 ]\n",
      "2= tensor([[-0.0078,  0.0520]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08727736 0.5441572  0.19406645 0.25945285]\n",
      "2= tensor([[-0.1365, -0.2667]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.09816051 0.346871   0.19925551 0.6065251 ]\n",
      "2= tensor([[0.0217, 0.1257]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00719957 -0.03896508  0.02518082  0.01495905]\n",
      "2= tensor([[-0.0830, -0.1170]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00797888 -0.23443893  0.02548001  0.31547925]\n",
      "2= tensor([[0.0494, 0.2078]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01266765 -0.03968902  0.03178959  0.03093952]\n",
      "2= tensor([[-0.0766, -0.0982]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01346143 -0.23525208  0.03240838  0.33348048]\n",
      "2= tensor([[0.0544, 0.2191]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01816648 -0.04060603  0.03907799  0.05119111]\n",
      "2= tensor([[-0.0688, -0.0749]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0189786  -0.2362659   0.04010181  0.35594285]\n",
      "2= tensor([[0.0604, 0.2318]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02370391 -0.04173637  0.04722067  0.07616992]\n",
      "2= tensor([[-0.0594, -0.0467]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02453864  0.15267794  0.04874407 -0.20124876]\n",
      "2= tensor([[-0.2007, -0.4689]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02148508 -0.04310603  0.04471909  0.10640346]\n",
      "2= tensor([[-0.0501, -0.0179]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0223472   0.1513475   0.04684716 -0.1718422 ]\n",
      "2= tensor([[-0.1907, -0.4364]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01932025 -0.04441256  0.04341032  0.13524376]\n",
      "2= tensor([[-0.0419,  0.0081]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02020851  0.15006158  0.04611519 -0.143434  ]\n",
      "2= tensor([[-0.1810, -0.4050]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01720727 -0.04568943  0.04324651  0.1634334 ]\n",
      "2= tensor([[-0.0328,  0.0301]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01812106  0.1487876   0.04651518 -0.11529888]\n",
      "2= tensor([[-0.1711, -0.3737]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01514531 -0.04696891  0.0442092   0.1916888 ]\n",
      "2= tensor([[-0.0237,  0.0522]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01608469  0.14749363  0.04804298 -0.08672673]\n",
      "2= tensor([[-0.1604, -0.3409]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01313482 -0.04828287  0.04630845  0.2207184 ]\n",
      "2= tensor([[-0.0141,  0.0750]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01410047  0.14614761  0.05072281 -0.05700486]\n",
      "2= tensor([[-0.1491, -0.3067]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01117752 -0.04966354  0.04958272  0.25124022]\n",
      "2= tensor([[-0.0042,  0.0983]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01217079  0.1447166   0.05460752 -0.02540031]\n",
      "2= tensor([[-0.1373, -0.2713]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00927646 -0.05114422  0.05409952  0.28399962]\n",
      "2= tensor([[0.0054, 0.1227]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01029934  0.14316607  0.05977951  0.00885812]\n",
      "2= tensor([[-0.1251, -0.2349]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00743602 -0.05276     0.05995667  0.31978697]\n",
      "2= tensor([[0.0157, 0.1485]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00849122  0.1414591   0.0663524   0.04659849]\n",
      "2= tensor([[-0.1115, -0.1948]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00566204 -0.05454846  0.06728438  0.35945615]\n",
      "2= tensor([[0.0274, 0.1750]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00675301  0.13955572  0.0744735   0.08872538]\n",
      "2= tensor([[-0.0961, -0.1500]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0039619  -0.05655034  0.07624801  0.40394408]\n",
      "2= tensor([[0.0395, 0.2003]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0050929   0.13741212  0.08432689  0.13624091]\n",
      "2= tensor([[-0.0793, -0.1006]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00234466 -0.0588101   0.08705171  0.4542911 ]\n",
      "2= tensor([[0.0511, 0.2251]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00352086  0.13498002  0.09613753  0.1902675 ]\n",
      "2= tensor([[-0.0609, -0.0459]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00082126  0.32860455  0.09994288 -0.07060723]\n",
      "2= tensor([[-0.1943, -0.4434]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00575083 0.13220234 0.09853074 0.25186026]\n",
      "2= tensor([[-0.0411,  0.0029]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00839488  0.32578936  0.10356794 -0.00819065]\n",
      "2= tensor([[-0.1732, -0.3775]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01491066 0.12934634 0.10340413 0.31528956]\n",
      "2= tensor([[-0.0219,  0.0516]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01749759 0.32285503 0.10970992 0.05692361]\n",
      "2= tensor([[-0.1508, -0.3088]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.02395469 0.12634498 0.11084839 0.38210654]\n",
      "2= tensor([[-0.0007,  0.1029]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02648159 -0.070162    0.11849052  0.7075807 ]\n",
      "2= tensor([[0.0880, 0.3101]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02507835 0.12313658 0.13264214 0.45442063]\n",
      "2= tensor([[0.0202, 0.1565]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02754108 0.3161581  0.14173055 0.20631418]\n",
      "2= tensor([[-0.0981, -0.1508]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03386424 0.11932387 0.14585683 0.54013443]\n",
      "2= tensor([[0.0369, 0.2034]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03625072 0.31212693 0.15665953 0.29673073]\n",
      "2= tensor([[-0.0636, -0.0652]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04249326 0.11515906 0.16259414 0.63443416]\n",
      "2= tensor([[0.0539, 0.2423]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04479644 0.30768448 0.17528282 0.3970473 ]\n",
      "2= tensor([[-0.0276,  0.0165]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05095013 0.4999428  0.18322377 0.16434836]\n",
      "2= tensor([[-0.1588, -0.3248]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06094899 0.3027354  0.18651073 0.50877494]\n",
      "2= tensor([[0.0079, 0.0980]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0670037  0.4948077  0.19668624 0.28017986]\n",
      "2= tensor([[-0.1151, -0.2044]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07689985 0.29750347 0.20228983 0.6278837 ]\n",
      "2= tensor([[0.0322, 0.1625]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01192102  0.04656685 -0.00656225 -0.04687631]\n",
      "2= tensor([[-0.1276, -0.2340]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01098968  0.24178228 -0.00749977 -0.34162244]\n",
      "2= tensor([[-0.2726, -0.6789]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00615404  0.04676783 -0.01433222 -0.0513139 ]\n",
      "2= tensor([[-0.1306, -0.2417]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00521868 -0.1481457  -0.0153585   0.23681284]\n",
      "2= tensor([[0.0086, 0.1264]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0081816   0.04719226 -0.01062224 -0.06067476]\n",
      "2= tensor([[-0.1334, -0.2514]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00723775 -0.14777578 -0.01183574  0.22863793]\n",
      "2= tensor([[0.0065, 0.1216]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01019327  0.04751328 -0.00726298 -0.06775478]\n",
      "2= tensor([[-0.1354, -0.2586]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.009243   -0.1475038  -0.00861807  0.22262782]\n",
      "2= tensor([[0.0049, 0.1182]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01219308  0.04774027 -0.00416552 -0.07276108]\n",
      "2= tensor([[-0.1367, -0.2633]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01123827 -0.14732172 -0.00562074  0.2186047 ]\n",
      "2= tensor([[0.0040, 0.1161]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01418471  0.04788013 -0.00124865 -0.07584593]\n",
      "2= tensor([[-0.1374, -0.2661]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0132271  -0.1472239  -0.00276556  0.21644278]\n",
      "2= tensor([[0.0036, 0.1152]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01617158  0.04793748  0.00156329 -0.07711124]\n",
      "2= tensor([[-0.1373, -0.2667]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-1.5212831e-02 -1.4720684e-01  2.1066706e-05  2.1606450e-01]\n",
      "2= tensor([[0.0037, 0.1157]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01815697  0.0479148   0.00434236 -0.07661179]\n",
      "2= tensor([[-0.1366, -0.2653]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01719867 -0.14726913  0.00281012  0.217438  ]\n",
      "2= tensor([[0.0043, 0.1174]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02014405  0.04781254  0.00715888 -0.07435717]\n",
      "2= tensor([[-0.1353, -0.2617]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0191878  -0.1474113   0.00567174  0.2205758 ]\n",
      "2= tensor([[0.0054, 0.1205]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02213603  0.04762911  0.01008325 -0.07031266]\n",
      "2= tensor([[-0.1332, -0.2561]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02118345 -0.14763594  0.008677    0.22553445]\n",
      "2= tensor([[0.0071, 0.1247]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02413617 -0.34288082  0.01318769  0.52094173]\n",
      "2= tensor([[0.0993, 0.3098]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03099378 -0.5381859   0.02360652  0.817751  ]\n",
      "2= tensor([[0.1238, 0.4042]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0417575  -0.3433949   0.03996154  0.53258556]\n",
      "2= tensor([[0.0990, 0.3146]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0486254  -0.14885713  0.05061325  0.25275743]\n",
      "2= tensor([[0.0180, 0.1527]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05160254  0.04550695  0.0556684  -0.02354139]\n",
      "2= tensor([[-0.1088, -0.1913]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0506924  -0.15036732  0.05519758  0.28617293]\n",
      "2= tensor([[0.0281, 0.1747]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05369975  0.04392576  0.06092104  0.01139702]\n",
      "2= tensor([[-0.0961, -0.1525]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05282123 -0.15201457  0.06114898  0.322662  ]\n",
      "2= tensor([[0.0381, 0.1968]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05586153  0.04218573  0.06760222  0.04987257]\n",
      "2= tensor([[-0.0821, -0.1101]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05501781 -0.15383716  0.06859966  0.36309522]\n",
      "2= tensor([[0.0488, 0.2205]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05809455  0.04024614  0.07586157  0.09280749]\n",
      "2= tensor([[-0.0672, -0.0645]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05728963  0.23420341  0.07771772 -0.17500974]\n",
      "2= tensor([[-0.2031, -0.4740]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05260556  0.03806019  0.07421753  0.14114301]\n",
      "2= tensor([[-0.0526, -0.0186]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05184436  0.23204505  0.07704039 -0.12723334]\n",
      "2= tensor([[-0.1882, -0.4245]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04720346  0.03590883  0.07449572  0.18872583]\n",
      "2= tensor([[-0.0389,  0.0204]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04648528  0.22989032  0.07827023 -0.0795579 ]\n",
      "2= tensor([[-0.1719, -0.3732]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04188747  0.03373866  0.07667908  0.23675676]\n",
      "2= tensor([[-0.0235,  0.0579]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0412127   0.22768614  0.08141422 -0.03078806]\n",
      "2= tensor([[-0.1544, -0.3203]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03665898  0.03149676  0.08079845  0.2864306 ]\n",
      "2= tensor([[-0.0073,  0.0963]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03602904  0.22537902  0.08652706  0.02028489]\n",
      "2= tensor([[-0.1358, -0.2647]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03152146  0.02912961  0.08693276  0.33896494]\n",
      "2= tensor([[0.0071, 0.1336]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03093887  0.22291394  0.09371206  0.07491219]\n",
      "2= tensor([[-0.1170, -0.2072]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02648059  0.02658217  0.09521031  0.3956287 ]\n",
      "2= tensor([[0.0225, 0.1724]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02594895  0.22023337  0.10312288  0.13441704]\n",
      "2= tensor([[-0.0963, -0.1446]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02154428  0.02379707  0.10581122  0.4577706 ]\n",
      "2= tensor([[0.0375, 0.2070]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02106834  0.21727651  0.11496663  0.20022503]\n",
      "2= tensor([[-0.0739, -0.0768]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01672281  0.02071401  0.11897113  0.5268482 ]\n",
      "2= tensor([[0.0502, 0.2353]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01630853  0.21397872  0.1295081   0.27389538]\n",
      "2= tensor([[-0.0481, -0.0142]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01202895  0.40703788  0.134986    0.02470082]\n",
      "2= tensor([[-0.1774, -0.3846]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0038882   0.21026431  0.13548002  0.35674164]\n",
      "2= tensor([[-0.0228,  0.0487]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [3.1708862e-04 4.0322617e-01 1.4261486e-01 1.0966053e-01]\n",
      "2= tensor([[-0.1492, -0.2970]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00838161 0.20637916 0.14480807 0.44372013]\n",
      "2= tensor([[0.0052, 0.1150]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0125092  0.3991872  0.15368247 0.19996001]\n",
      "2= tensor([[-0.1183, -0.2040]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.02049294 0.20223942 0.15768166 0.5369049 ]\n",
      "2= tensor([[0.0259, 0.1721]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02453773 0.39483395 0.16841976 0.2977636 ]\n",
      "2= tensor([[-0.0810, -0.1069]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03243441 0.19776171 0.17437503 0.638471  ]\n",
      "2= tensor([[0.0433, 0.2202]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03638964 0.3900787  0.18714446 0.4053771 ]\n",
      "2= tensor([[-0.0390, -0.0171]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04419122 0.5821223  0.195252   0.17704123]\n",
      "2= tensor([[-0.1709, -0.3586]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05583366 0.3848202  0.19879282 0.5244111 ]\n",
      "2= tensor([[-0.0016,  0.0685]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06353007 0.5766712  0.20928104 0.30036303]\n",
      "2= tensor([[-0.1249, -0.2344]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00477566  0.00596256 -0.01447739  0.03618763]\n",
      "2= tensor([[-0.0913, -0.1245]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0046564  -0.18894883 -0.01375363  0.32426786]\n",
      "2= tensor([[0.0409, 0.1948]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00843538  0.00636623 -0.00726828  0.02727955]\n",
      "2= tensor([[-0.0933, -0.1320]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00830806 -0.18865073 -0.00672268  0.31766042]\n",
      "2= tensor([[0.0397, 0.1924]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01208107  0.00656632 -0.00036948  0.022865  ]\n",
      "2= tensor([[-0.0937, -0.1350]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-1.1949745e-02 -1.8855032e-01  8.7823319e-05  3.1543133e-01]\n",
      "2= tensor([[0.0397, 0.1925]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01572075  0.00657037  0.00639645  0.0227761 ]\n",
      "2= tensor([[-0.0927, -0.1334]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01558934 -0.18864273  0.00685197  0.31747028]\n",
      "2= tensor([[0.0406, 0.1948]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0193622   0.00638097  0.01320138  0.02695609]\n",
      "2= tensor([[-0.0903, -0.1275]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01923458  0.20131114  0.0137405  -0.2615326 ]\n",
      "2= tensor([[-0.2353, -0.5664]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01520836  0.00599576  0.00850985  0.03545239]\n",
      "2= tensor([[-0.0884, -0.1204]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01508844 -0.18924718  0.0092189   0.33080807]\n",
      "2= tensor([[0.0440, 0.2022]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01887338  0.00574234  0.01583506  0.04104653]\n",
      "2= tensor([[-0.0854, -0.1129]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01875854 -0.18960306  0.01665599  0.33868322]\n",
      "2= tensor([[0.0464, 0.2078]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0225506   0.00527797  0.02342965  0.05129884]\n",
      "2= tensor([[-0.0809, -0.1006]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02244504 -0.19017197  0.02445563  0.35128096]\n",
      "2= tensor([[0.0500, 0.2158]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02624848  0.00459382  0.03148125  0.06640889]\n",
      "2= tensor([[-0.0749, -0.0833]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0261566  -0.19096501  0.03280943  0.36885574]\n",
      "2= tensor([[0.0547, 0.2259]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0299759   0.00367577  0.04018654  0.08669594]\n",
      "2= tensor([[-0.0672, -0.0606]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02990239  0.19819933  0.04192046 -0.19304216]\n",
      "2= tensor([[-0.2081, -0.4853]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0259384   0.00250356  0.03805961  0.11256462]\n",
      "2= tensor([[-0.0595, -0.0362]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02588833  0.19706006  0.04031091 -0.16787197]\n",
      "2= tensor([[-0.1999, -0.4583]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02194713  0.00138498  0.03695347  0.13725041]\n",
      "2= tensor([[-0.0522, -0.0138]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02191943  0.19595869  0.03969848 -0.14354907]\n",
      "2= tensor([[-0.1918, -0.4324]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01800025  0.00029136  0.0368275   0.161389  ]\n",
      "2= tensor([[-0.0451,  0.0057]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01799443  0.19486725  0.04005527 -0.11945213]\n",
      "2= tensor([[-0.1837, -0.4066]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01409708 -0.00080501  0.03766623  0.18559395]\n",
      "2= tensor([[-0.0372,  0.0240]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01411318 -0.19644508  0.04137811  0.48991716]\n",
      "2= tensor([[0.0788, 0.2749]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01804208 -0.00193054  0.05117645  0.21055679]\n",
      "2= tensor([[-0.0277,  0.0461]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01808069  0.19242375  0.05538759 -0.06555365]\n",
      "2= tensor([[-0.1627, -0.3445]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01423222 -0.00344676  0.05407652  0.24407719]\n",
      "2= tensor([[-0.0166,  0.0720]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01430115  0.19086276  0.05895806 -0.0310703 ]\n",
      "2= tensor([[-0.1499, -0.3064]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0104839   0.38509184  0.05833666 -0.30458406]\n",
      "2= tensor([[-0.2840, -0.7201]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00278206  0.18918917  0.05224498  0.00591133]\n",
      "2= tensor([[-0.1383, -0.2699]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00100172 -0.00664162  0.0523632   0.31460974]\n",
      "2= tensor([[0.0049, 0.1218]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00086889 0.18769684 0.0586554  0.03888935]\n",
      "2= tensor([[-0.1265, -0.2358]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00462282  0.38193077  0.05943318 -0.23472568]\n",
      "2= tensor([[-0.2625, -0.6515]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01226144 0.18601222 0.05473867 0.0760963 ]\n",
      "2= tensor([[-0.1150, -0.2000]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01598168 -0.00984998  0.0562606   0.3855347 ]\n",
      "2= tensor([[0.0246, 0.1689]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01578468 0.18443002 0.06397129 0.11110769]\n",
      "2= tensor([[-0.1024, -0.1635]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01947328 -0.0115475   0.06619345  0.4232674 ]\n",
      "2= tensor([[0.0344, 0.1902]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01924234 0.18257733 0.07465879 0.15216452]\n",
      "2= tensor([[-0.0883, -0.1218]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02289388 -0.01352985  0.07770208  0.46743515]\n",
      "2= tensor([[0.0447, 0.2122]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02262328 0.18041326 0.08705079 0.20021969]\n",
      "2= tensor([[-0.0718, -0.0729]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02623155 -0.01583889  0.09105518  0.51904386]\n",
      "2= tensor([[0.0540, 0.2330]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02591477 0.1778911  0.10143606 0.25638595]\n",
      "2= tensor([[-0.0505, -0.0241]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02947259  0.37142956  0.10656378 -0.00265838]\n",
      "2= tensor([[-0.1844, -0.4089]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03690118 0.1749535  0.10651061 0.3216544 ]\n",
      "2= tensor([[-0.0310,  0.0249]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04040026 0.3684102  0.11294369 0.06436872]\n",
      "2= tensor([[-0.1615, -0.3389]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04776846 0.17186534 0.11423107 0.39044252]\n",
      "2= tensor([[-0.0088,  0.0777]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05120577 0.36519644 0.12203992 0.13584682]\n",
      "2= tensor([[-0.1373, -0.2656]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0585097  0.168557   0.12475686 0.4644029 ]\n",
      "2= tensor([[0.0147, 0.1328]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06188083 0.3617156  0.13404492 0.2135003 ]\n",
      "2= tensor([[-0.1103, -0.1854]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06911515 0.16495728 0.13831492 0.5452815 ]\n",
      "2= tensor([[0.0310, 0.1798]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.07241429 0.35789245 0.14922056 0.29917774]\n",
      "2= tensor([[-0.0770, -0.1026]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07957214 0.5506073  0.1552041  0.05702604]\n",
      "2= tensor([[-0.2129, -0.4812]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.09058429 0.35363993 0.15634462 0.3943728 ]\n",
      "2= tensor([[-0.0412, -0.0253]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09765708 0.546238   0.16423208 0.15477766]\n",
      "2= tensor([[-0.1795, -0.3842]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.10858185 0.34919205 0.16732764 0.49443692]\n",
      "2= tensor([[-0.0083,  0.0482]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.11556569 0.54160804 0.17721638 0.25880915]\n",
      "2= tensor([[-0.1400, -0.2774]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.12639785 0.34445727 0.18239255 0.601733  ]\n",
      "2= tensor([[0.0201, 0.1173]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.133287   0.5366225  0.19442722 0.37159303]\n",
      "2= tensor([[-0.0929, -0.1673]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.14401944 0.7285277  0.20185907 0.14596105]\n",
      "2= tensor([[-0.2253, -0.5229]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.15859    0.53117347 0.2047783  0.49492607]\n",
      "2= tensor([[-0.0452, -0.0648]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0360976   0.03685294  0.02680914  0.02530466]\n",
      "2= tensor([[-0.0949, -0.1406]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03536054 -0.15864302  0.02731523  0.32632416]\n",
      "2= tensor([[0.0385, 0.1954]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0385334  -0.354143    0.03384171  0.62749445]\n",
      "2= tensor([[0.1058, 0.3391]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04561626 -0.15950933  0.0463916   0.34565863]\n",
      "2= tensor([[0.0445, 0.2096]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04880645  0.03492306  0.05330478  0.06795808]\n",
      "2= tensor([[-0.0769, -0.0906]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04810799 -0.16092099  0.05466394  0.3769711 ]\n",
      "2= tensor([[0.0528, 0.2271]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05132641  0.03338369  0.06220336  0.1020126 ]\n",
      "2= tensor([[-0.0649, -0.0541]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05065873  0.22756158  0.06424361 -0.17041492]\n",
      "2= tensor([[-0.2025, -0.4687]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0461075   0.03158174  0.06083531  0.14182304]\n",
      "2= tensor([[-0.0530, -0.0170]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04547586  0.22578204  0.06367178 -0.13106398]\n",
      "2= tensor([[-0.1900, -0.4278]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04096022  0.02980853  0.06105049  0.18100746]\n",
      "2= tensor([[-0.0416,  0.0148]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04036405  0.22400616  0.06467064 -0.09180859]\n",
      "2= tensor([[-0.1767, -0.3854]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03588393  0.02801974  0.06283447  0.22055641]\n",
      "2= tensor([[-0.0289,  0.0454]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03532353  0.22218989  0.0672456  -0.05166285]\n",
      "2= tensor([[-0.1623, -0.3417]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03087974  0.02617137  0.06621234  0.26145568]\n",
      "2= tensor([[-0.0154,  0.0769]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03035631  0.22028875  0.07144146 -0.00963014]\n",
      "2= tensor([[-0.1470, -0.2963]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02595053  0.02421881  0.07124885  0.30471048]\n",
      "2= tensor([[-0.0017,  0.1095]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02546616  0.2182569   0.07734306  0.03532124]\n",
      "2= tensor([[-0.1308, -0.2483]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02110102  0.02211593  0.07804949  0.35136935]\n",
      "2= tensor([[0.0110, 0.1422]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0206587  -0.17402418  0.08507688  0.6676071 ]\n",
      "2= tensor([[0.0929, 0.3217]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02413919  0.01981805  0.09842902  0.40287784]\n",
      "2= tensor([[0.0254, 0.1790]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02374282  0.21341625  0.10648657  0.14277756]\n",
      "2= tensor([[-0.0918, -0.1324]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0194745   0.01694316  0.10934213  0.46706578]\n",
      "2= tensor([[0.0406, 0.2132]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01913564  0.21036415  0.11868344  0.2107495 ]\n",
      "2= tensor([[-0.0686, -0.0637]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01492835  0.40360683  0.12289843 -0.04226438]\n",
      "2= tensor([[-0.1988, -0.4519]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00685622  0.20695649  0.12205314  0.28652754]\n",
      "2= tensor([[-0.0442, -0.0042]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00271709  0.40014556  0.12778369  0.03469429]\n",
      "2= tensor([[-0.1742, -0.3741]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00528582 0.20344478 0.12847757 0.3648061 ]\n",
      "2= tensor([[-0.0200,  0.0554]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.00935472 0.3965291  0.1357737  0.11523528]\n",
      "2= tensor([[-0.1470, -0.2904]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0172853  0.19974935 0.1380784  0.44748336]\n",
      "2= tensor([[0.0066, 0.1182]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.02128029 0.39267558 0.14702807 0.20131451]\n",
      "2= tensor([[-0.1176, -0.2018]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0291338  0.19579028 0.15105437 0.5365268 ]\n",
      "2= tensor([[0.0263, 0.1724]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03304961 0.38850164 0.1617849  0.29499266]\n",
      "2= tensor([[-0.0819, -0.1093]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04081964 0.19148745 0.16768475 0.6340124 ]\n",
      "2= tensor([[0.0428, 0.2185]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04464939 0.3839226  0.180365   0.39847693]\n",
      "2= tensor([[-0.0412, -0.0223]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05232784 0.5760889  0.18833454 0.16764367]\n",
      "2= tensor([[-0.1746, -0.3687]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06384962 0.37884042 0.1916874  0.5133282 ]\n",
      "2= tensor([[-0.0046,  0.0610]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.07142643 0.57081926 0.20195398 0.28664595]\n",
      "2= tensor([[-0.1301, -0.2485]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08284281 0.37347615 0.2076869  0.63561624]\n",
      "2= tensor([[0.0234, 0.1320]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03335689 -0.0100943   0.00847706  0.03988858]\n",
      "2= tensor([[-0.0882, -0.1263]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03315501 -0.20533678  0.00927483  0.33523402]\n",
      "2= tensor([[0.0457, 0.1988]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02904827 -0.01034804  0.01597952  0.04549025]\n",
      "2= tensor([[-0.0849, -0.1180]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02884131 -0.20569545  0.01688932  0.34317172]\n",
      "2= tensor([[0.0483, 0.2046]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0247274  -0.01081779  0.02375275  0.05586215]\n",
      "2= tensor([[-0.0802, -0.1050]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02451104 -0.20627213  0.02487     0.3559436 ]\n",
      "2= tensor([[0.0520, 0.2131]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0203856  -0.01151244  0.03198887  0.07120544]\n",
      "2= tensor([[-0.0741, -0.0872]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02015535 -0.20707804  0.03341298  0.3738069 ]\n",
      "2= tensor([[0.0571, 0.2235]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01601379 -0.01244627  0.04088912  0.09184378]\n",
      "2= tensor([[-0.0662, -0.0639]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01576486  0.18206649  0.04272599 -0.18766342]\n",
      "2= tensor([[-0.2075, -0.4885]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01940619 -0.01363989  0.03897272  0.11818584]\n",
      "2= tensor([[-0.0583, -0.0386]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0191334   0.18090263  0.04133644 -0.16195126]\n",
      "2= tensor([[-0.1989, -0.4607]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02275145 -0.01478596  0.03809742  0.14348033]\n",
      "2= tensor([[-0.0506, -0.0154]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02245573  0.17977026  0.04096702 -0.13694431]\n",
      "2= tensor([[-0.1905, -0.4336]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02605114 -0.0159138   0.03822814  0.16837643]\n",
      "2= tensor([[-0.0426,  0.0050]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02573286  0.17864071  0.04159566 -0.11200577]\n",
      "2= tensor([[-0.1820, -0.4067]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02930567 -0.01705184  0.03935555  0.19350474]\n",
      "2= tensor([[-0.0345,  0.0240]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02896464 -0.21271402  0.04322564  0.49833828]\n",
      "2= tensor([[0.0822, 0.2752]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02471036 -0.01822732  0.05319241  0.21958512]\n",
      "2= tensor([[-0.0246,  0.0473]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02434581  0.17609552  0.05758411 -0.05585568]\n",
      "2= tensor([[-0.1592, -0.3409]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02786772 -0.01980279  0.056467    0.2544251 ]\n",
      "2= tensor([[-0.0130,  0.0745]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02747166  0.17446935  0.0615555  -0.01992616]\n",
      "2= tensor([[-0.1459, -0.3017]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03096105 -0.02147889  0.06115698  0.29152542]\n",
      "2= tensor([[-0.0004,  0.1034]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03053147 0.17272015 0.06698748 0.01874038]\n",
      "2= tensor([[-0.1317, -0.2602]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03398588 -0.02329534  0.06736229  0.33178377]\n",
      "2= tensor([[0.0121, 0.1328]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03351997 0.17080633 0.07399797 0.06108112]\n",
      "2= tensor([[-0.1166, -0.2156]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0369361  -0.02529429  0.07521959  0.37616265]\n",
      "2= tensor([[0.0245, 0.1644]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03643021 0.16868319 0.08274284 0.10811289]\n",
      "2= tensor([[-0.1000, -0.1657]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03980387 -0.027521    0.0849051   0.42571092]\n",
      "2= tensor([[0.0374, 0.1932]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.03925345 0.16630213 0.09341932 0.16095565]\n",
      "2= tensor([[-0.0816, -0.1105]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0425795  -0.03002444  0.09663843  0.48158678]\n",
      "2= tensor([[0.0497, 0.2199]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04197901 0.16361012 0.10627017 0.22085765]\n",
      "2= tensor([[-0.0606, -0.0518]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04525121 -0.03285768  0.11068732  0.54508144]\n",
      "2= tensor([[0.0604, 0.2452]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04459406 0.16054913 0.12158895 0.28922227]\n",
      "2= tensor([[-0.0370,  0.0053]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04780504 0.35374638 0.1273734  0.03722503]\n",
      "2= tensor([[-0.1664, -0.3618]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05487997 0.15704983 0.12811789 0.3672263 ]\n",
      "2= tensor([[-0.0130,  0.0649]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05802096 0.3501406  0.13546242 0.11752769]\n",
      "2= tensor([[-0.1392, -0.2787]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.06502377 0.153364   0.13781297 0.44969282]\n",
      "2= tensor([[0.0137, 0.1278]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06809106 0.34629512 0.14680684 0.20342885]\n",
      "2= tensor([[-0.1096, -0.1893]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07501696 0.14941204 0.1508754  0.5385831 ]\n",
      "2= tensor([[0.0323, 0.1811]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0780052  0.34212688 0.16164707 0.296984  ]\n",
      "2= tensor([[-0.0735, -0.0968]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.08484773 0.1451141  0.16758674 0.63596815]\n",
      "2= tensor([[0.0483, 0.2265]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08775002 0.33755141 0.1803061  0.40039644]\n",
      "2= tensor([[-0.0335, -0.0099]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09450105 0.52971905 0.18831404 0.1695411 ]\n",
      "2= tensor([[-0.1677, -0.3567]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.10509543 0.33247083 0.19170487 0.51522046]\n",
      "2= tensor([[0.0028, 0.0732]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.11174484 0.5244497  0.20200928 0.28854412]\n",
      "2= tensor([[-0.1220, -0.2333]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.12223384 0.32710642 0.20778015 0.63752735]\n",
      "2= tensor([[0.0301, 0.1429]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.03028348  0.00954747 -0.04622903  0.00245525]\n",
      "2= tensor([[-0.1113, -0.1786]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03047442 -0.18488206 -0.04617993  0.28020146]\n",
      "2= tensor([[0.0253, 0.1571]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02677678  0.01086718 -0.0405759  -0.02668144]\n",
      "2= tensor([[-0.1204, -0.2085]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02699413 -0.18365009 -0.04110953  0.2529283 ]\n",
      "2= tensor([[0.0181, 0.1404]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02332113  0.01203401 -0.03605096 -0.05243269]\n",
      "2= tensor([[-0.1285, -0.2350]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02356181 -0.18255296 -0.03709962  0.22866143]\n",
      "2= tensor([[0.0114, 0.1250]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01991075  0.01307898 -0.03252639 -0.07548933]\n",
      "2= tensor([[-0.1362, -0.2597]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02017233 -0.18156195 -0.03403617  0.20675655]\n",
      "2= tensor([[0.0052, 0.1110]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01654109  0.01402977 -0.02990104 -0.0964658 ]\n",
      "2= tensor([[-0.1432, -0.2820]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01682168 -0.18065116 -0.03183036  0.18663545]\n",
      "2= tensor([[-0.0004,  0.0981]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01320866  0.01491141 -0.02809765 -0.11591635]\n",
      "2= tensor([[-0.1497, -0.3027]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01350689 -0.17979692 -0.03041598  0.16777124]\n",
      "2= tensor([[-0.0054,  0.0848]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00991095  0.01574691 -0.02706055 -0.13434975]\n",
      "2= tensor([[-0.1560, -0.3227]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01022589 -0.17897719 -0.02974755  0.14967462]\n",
      "2= tensor([[-0.0106,  0.0718]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00664634  0.01655782 -0.02675406 -0.15224262]\n",
      "2= tensor([[-0.1620, -0.3417]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0069775  -0.17817102 -0.02979891  0.13188137]\n",
      "2= tensor([[-0.0161,  0.0588]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00341408  0.01736482 -0.02716128 -0.17005178]\n",
      "2= tensor([[-0.1679, -0.3606]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00376138 -0.17735805 -0.03056232  0.11394036]\n",
      "2= tensor([[-0.0216,  0.0452]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00021421  0.0181882  -0.02828351 -0.18822594]\n",
      "2= tensor([[-0.1740, -0.3798]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00057798 -0.17651793 -0.03204803  0.09540219]\n",
      "2= tensor([[-0.0273,  0.0311]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00295238  0.01904835 -0.03013998 -0.2072171 ]\n",
      "2= tensor([[-0.1805, -0.4000]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00257141 -0.17562994 -0.03428433  0.07580789]\n",
      "2= tensor([[-0.0333,  0.0161]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00608401  0.0199663  -0.03276817 -0.22749168]\n",
      "2= tensor([[-0.1875, -0.4217]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00568469 -0.17467241 -0.037318    0.05467753]\n",
      "2= tensor([[-0.0401, -0.0033]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00917813  0.02096421 -0.03622445 -0.24954201]\n",
      "2= tensor([[-0.1951, -0.4453]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00875885 -0.1736222  -0.04121529  0.03149847]\n",
      "2= tensor([[-0.0484, -0.0257]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01223129  0.02206581 -0.04058532 -0.27389815]\n",
      "2= tensor([[-0.2037, -0.4715]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01178998 -0.17245427 -0.04606329  0.00571288]\n",
      "2= tensor([[-0.0578, -0.0519]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01523906  0.023297   -0.04594903 -0.30114037]\n",
      "2= tensor([[-0.2133, -0.5016]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01477312 -0.17114095 -0.05197183 -0.02329554]\n",
      "2= tensor([[-0.0685, -0.0818]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01819594 -0.36548054 -0.05243775  0.2525474 ]\n",
      "2= tensor([[0.0562, 0.2082]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02550555 -0.16965057 -0.0473868  -0.05620344]\n",
      "2= tensor([[-0.0781, -0.1125]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02889857 -0.36406216 -0.04851087  0.2211601 ]\n",
      "2= tensor([[0.0495, 0.1949]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03617981 -0.16828158 -0.04408767 -0.08642189]\n",
      "2= tensor([[-0.0868, -0.1403]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03954544 -0.36274475 -0.0458161   0.19203185]\n",
      "2= tensor([[0.0424, 0.1811]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04680033 -0.16699834 -0.04197546 -0.11474487]\n",
      "2= tensor([[-0.0951, -0.1662]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0501403  -0.36149448 -0.04427036  0.16440521]\n",
      "2= tensor([[0.0352, 0.1669]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05737019 -0.16576768 -0.04098226 -0.14190859]\n",
      "2= tensor([[-0.1030, -0.1910]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06068555 -0.36027947 -0.04382043  0.13756868]\n",
      "2= tensor([[0.0278, 0.1525]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06789114 -0.16455816 -0.04106906 -0.16861053]\n",
      "2= tensor([[-0.1116, -0.2179]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0711823  -0.35906893 -0.04444127  0.1108387 ]\n",
      "2= tensor([[0.0204, 0.1372]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07836368 -0.16333927 -0.04222449 -0.19552736]\n",
      "2= tensor([[-0.1202, -0.2463]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08163046 -0.35783258 -0.04613504  0.08354229]\n",
      "2= tensor([[0.0129, 0.1213]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08878712 -0.16208072 -0.0444642  -0.22333199]\n",
      "2= tensor([[-0.1293, -0.2758]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09202873  0.03364762 -0.04893083 -0.5297025 ]\n",
      "2= tensor([[-0.2901, -0.7465]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09135578 -0.16075307 -0.05952489 -0.2528304 ]\n",
      "2= tensor([[-0.1401, -0.3100]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09457084 -0.35497677 -0.06458149  0.02049922]\n",
      "2= tensor([[-0.0049,  0.0810]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10167037 -0.15899096 -0.06417151 -0.29184043]\n",
      "2= tensor([[-0.1528, -0.3517]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1048502   0.03698448 -0.07000832 -0.604052  ]\n",
      "2= tensor([[-0.3252, -0.8446]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1041105  -0.15709214 -0.08208936 -0.33421582]\n",
      "2= tensor([[-0.1699, -0.4033]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10725234 -0.35095567 -0.08877368 -0.06850696]\n",
      "2= tensor([[-0.0298,  0.0100]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11427145 -0.15468052 -0.09014381 -0.38782552]\n",
      "2= tensor([[-0.1927, -0.4700]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11736507  0.04159763 -0.09790032 -0.70751375]\n",
      "2= tensor([[-0.3769, -0.9842]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11653312 -0.15204161 -0.1120506  -0.44718248]\n",
      "2= tensor([[-0.2226, -0.5534]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11957395 -0.3454149  -0.12099425 -0.1918155 ]\n",
      "2= tensor([[-0.0758, -0.1286]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12648225 -0.5386169  -0.12483056  0.0603832 ]\n",
      "2= tensor([[0.0402, 0.1631]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.13725458 -0.34194675 -0.12362289 -0.26893145]\n",
      "2= tensor([[-0.1083, -0.2232]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14409351 -0.14529736 -0.12900153 -0.59790707]\n",
      "2= tensor([[-0.2939, -0.7566]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14699946 -0.33840075 -0.14095967 -0.34848014]\n",
      "2= tensor([[-0.1428, -0.3251]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.15376748 -0.5312659  -0.14792927 -0.1033568 ]\n",
      "2= tensor([[-0.0088,  0.0478]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1643928  -0.33436775 -0.1499964  -0.4388111 ]\n",
      "2= tensor([[-0.1839, -0.4442]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.17108016 -0.5270838  -0.15877262 -0.19691658]\n",
      "2= tensor([[-0.0464, -0.0455]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.18162183 -0.33008924 -0.16271095 -0.5351751 ]\n",
      "2= tensor([[-0.2296, -0.5736]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.18822362 -0.5225943  -0.17341445 -0.29785773]\n",
      "2= tensor([[-0.0899, -0.1720]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1986755  -0.7148748  -0.17937161 -0.06449153]\n",
      "2= tensor([[0.0297, 0.1211]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.212973   -0.5176952  -0.18066144 -0.40796855]\n",
      "2= tensor([[-0.1378, -0.3142]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.2233269  -0.70985746 -0.18882081 -0.17724234]\n",
      "2= tensor([[-0.0157,  0.0296]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.23752405 -0.51260567 -0.19236566 -0.5230451 ]\n",
      "2= tensor([[-0.1934, -0.4702]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.24777617 -0.70457405 -0.20282656 -0.29661137]\n",
      "2= tensor([[-0.0647, -0.0936]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.26186764 -0.89631426 -0.20875879 -0.07411969]\n",
      "2= tensor([[0.0518, 0.1515]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01214022 -0.00892124 -0.04912633 -0.04214573]\n",
      "2= tensor([[-0.1195, -0.2072]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0119618  -0.20330557 -0.04996924  0.23464166]\n",
      "2= tensor([[0.0178, 0.1392]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00789569 -0.00750661 -0.04527641 -0.07337503]\n",
      "2= tensor([[-0.1298, -0.2393]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00774555 -0.2019512  -0.04674391  0.20468625]\n",
      "2= tensor([[0.0093, 0.1200]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00370653 -0.00619304 -0.04265018 -0.10236797]\n",
      "2= tensor([[-0.1397, -0.2703]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00358267 -0.20067863 -0.04469754  0.17655978]\n",
      "2= tensor([[0.0014, 0.1020]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0004309  -0.00494646 -0.04116635 -0.12988195]\n",
      "2= tensor([[-0.1495, -0.3004]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00052983 -0.19945526 -0.04376398  0.14953458]\n",
      "2= tensor([[-0.0061,  0.0838]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00451894 -0.00373484 -0.04077329 -0.15662746]\n",
      "2= tensor([[-0.1585, -0.3291]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00459363 -0.19825001 -0.04390584  0.12291878]\n",
      "2= tensor([[-0.0135,  0.0646]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00855864 -0.00252744 -0.04144747 -0.18328632]\n",
      "2= tensor([[-0.1676, -0.3576]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00860918 -0.19703257 -0.04511319  0.09603874]\n",
      "2= tensor([[-0.0219,  0.0443]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01254984 -0.00129404 -0.04319242 -0.2105291 ]\n",
      "2= tensor([[-0.1769, -0.3868]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01257572  0.19441801 -0.047403   -0.516518  ]\n",
      "2= tensor([[-0.3235, -0.8458]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-8.6873565e-03 -5.5191836e-06 -5.7733361e-02 -2.3914158e-01]\n",
      "2= tensor([[-0.1883, -0.4205]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00868747 -0.19425723 -0.06251619  0.03478633]\n",
      "2= tensor([[-0.0437, -0.0122]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01257261  0.00170293 -0.06182047 -0.27694747]\n",
      "2= tensor([[-0.2015, -0.4624]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01253855 -0.19248508 -0.06735942 -0.00438554]\n",
      "2= tensor([[-0.0577, -0.0519]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01638825  0.00353501 -0.06744713 -0.31753758]\n",
      "2= tensor([[-0.2156, -0.5085]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01631755 -0.1905647  -0.07379788 -0.04686441]\n",
      "2= tensor([[-0.0732, -0.0960]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02012885 -0.3845551  -0.07473516  0.22165231]\n",
      "2= tensor([[0.0522, 0.1965]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02781995 -0.18844892 -0.07030212 -0.09363758]\n",
      "2= tensor([[-0.0877, -0.1413]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03158893 -0.3824965  -0.07217487  0.17606299]\n",
      "2= tensor([[0.0412, 0.1739]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03923886 -0.18641983 -0.06865361 -0.13848728]\n",
      "2= tensor([[-0.1016, -0.1849]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04296726 -0.38049474 -0.07142336  0.13177098]\n",
      "2= tensor([[0.0292, 0.1493]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05057715 -0.18442622 -0.06878794 -0.18256257]\n",
      "2= tensor([[-0.1157, -0.2311]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05426567 -0.3784999  -0.07243919  0.08765178]\n",
      "2= tensor([[0.0169, 0.1226]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06183567 -0.18241839 -0.07068615 -0.22697762]\n",
      "2= tensor([[-0.1306, -0.2800]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06548404 -0.3764627  -0.0752257   0.04259755]\n",
      "2= tensor([[0.0042, 0.0950]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07301329 -0.18034716 -0.07437375 -0.2728393 ]\n",
      "2= tensor([[-0.1451, -0.3291]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07662024 -0.37433344 -0.07983054 -0.00451003]\n",
      "2= tensor([[-0.0096,  0.0646]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08410691 -0.17816274 -0.07992074 -0.3212742 ]\n",
      "2= tensor([[-0.1620, -0.3833]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08767016 -0.37206098 -0.08634622 -0.05482687]\n",
      "2= tensor([[-0.0230,  0.0267]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09511138 -0.1758139  -0.08744276 -0.37345508]\n",
      "2= tensor([[-0.1833, -0.4464]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09862766  0.02043432 -0.09491187 -0.69237816]\n",
      "2= tensor([[-0.3674, -0.9612]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09821897 -0.17325166 -0.10875943 -0.43101898]\n",
      "2= tensor([[-0.2116, -0.5259]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.101684   -0.366679   -0.11737981 -0.17450449]\n",
      "2= tensor([[-0.0656, -0.1023]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10901759 -0.55994254 -0.1208699   0.07896549]\n",
      "2= tensor([[0.0483, 0.1772]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12021644 -0.36331388 -0.11929059 -0.24927491]\n",
      "2= tensor([[-0.0965, -0.1914]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12748271 -0.5565482  -0.12427609  0.00352833]\n",
      "2= tensor([[0.0281, 0.1325]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.13861367 -0.3598833  -0.12420552 -0.325637  ]\n",
      "2= tensor([[-0.1283, -0.2856]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14581135 -0.5530381  -0.13071826 -0.07455936]\n",
      "2= tensor([[0.0051, 0.0773]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.15687211 -0.35630807 -0.13220945 -0.4054587 ]\n",
      "2= tensor([[-0.1636, -0.3888]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.16399826 -0.54933167 -0.14031862 -0.1572065 ]\n",
      "2= tensor([[-0.0262,  0.0044]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1749849  -0.35250872 -0.14346275 -0.49065763]\n",
      "2= tensor([[-0.2025, -0.5015]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.18203507 -0.5453465  -0.1532759  -0.24640608]\n",
      "2= tensor([[-0.0620, -0.0943]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.19294201 -0.73798496 -0.15820402 -0.00572289]\n",
      "2= tensor([[0.0522, 0.1705]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.2077017  -0.5409896  -0.15831849 -0.343844  ]\n",
      "2= tensor([[-0.1045, -0.2176]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.21852149 -0.73354673 -0.16519536 -0.10497194]\n",
      "2= tensor([[0.0194, 0.0993]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.23319243 -0.5364902  -0.1672948  -0.4448796 ]\n",
      "2= tensor([[-0.1485, -0.3473]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.24392223 -0.7288992  -0.17619239 -0.20925103]\n",
      "2= tensor([[-0.0244,  0.0091]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.25850022 -0.53175306 -0.18037741 -0.55192494]\n",
      "2= tensor([[-0.2025, -0.4971]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.26913527 -0.7239446  -0.1914159  -0.32105866]\n",
      "2= tensor([[-0.0706, -0.1100]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.28361416 -0.9158987  -0.19783708 -0.0943196 ]\n",
      "2= tensor([[0.0488, 0.1448]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.30193216 -0.7185724  -0.19972348 -0.44232088]\n",
      "2= tensor([[-0.1262, -0.2665]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.31630358 -0.910391   -0.2085699  -0.21864168]\n",
      "2= tensor([[-0.0026,  0.0448]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "0 413 -946.9\n",
      "1= [-0.02730591 -0.04814195 -0.0074833   0.00323313]\n",
      "2= tensor([[-0.0844, -0.1170]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02826875 -0.24315579 -0.00741864  0.29354563]\n",
      "2= tensor([[0.0457, 0.2016]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03313187 -0.04792885 -0.00154773 -0.00146777]\n",
      "2= tensor([[-0.0848, -0.1193]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03409044 -0.24302858 -0.00157708  0.29072642]\n",
      "2= tensor([[0.0455, 0.2017]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03895102 -0.04788417  0.00423745 -0.00245348]\n",
      "2= tensor([[-0.0840, -0.1179]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0399087   0.14717676  0.00418838 -0.29379642]\n",
      "2= tensor([[-0.2326, -0.5602]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03696517 -0.04800466 -0.00168755  0.0002045 ]\n",
      "2= tensor([[-0.0838, -0.1162]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03792526 -0.24310237 -0.00168346  0.2923545 ]\n",
      "2= tensor([[0.0462, 0.2035]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04278731 -0.04795646  0.00416363 -0.00085889]\n",
      "2= tensor([[-0.0830, -0.1148]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04374643 -0.24313787  0.00414645  0.2931348 ]\n",
      "2= tensor([[0.0468, 0.2055]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04860919 -0.04807528  0.01000915  0.00176249]\n",
      "2= tensor([[-0.0811, -0.1097]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0495707  -0.24333934  0.01004439  0.29758653]\n",
      "2= tensor([[0.0484, 0.2096]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05443748 -0.048362    0.01599613  0.00808829]\n",
      "2= tensor([[-0.0779, -0.1007]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05540472 -0.24370967  0.01615789  0.30577496]\n",
      "2= tensor([[0.0509, 0.2154]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06027891 -0.4390581   0.02227339  0.60350955]\n",
      "2= tensor([[0.1127, 0.3446]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06906008 -0.24425463  0.03434358  0.31792468]\n",
      "2= tensor([[0.0543, 0.2244]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07394517 -0.04963823  0.04070207  0.03626725]\n",
      "2= tensor([[-0.0645, -0.0633]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07493793  0.14487712  0.04142742 -0.24330102]\n",
      "2= tensor([[-0.2077, -0.4880]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07204039  0.3393836   0.0365614  -0.5226342 ]\n",
      "2= tensor([[-0.3391, -0.8986]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06525272  0.14376664  0.02610872 -0.21865822]\n",
      "2= tensor([[-0.2019, -0.4651]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06237739 -0.05171861  0.02173555  0.0821448 ]\n",
      "2= tensor([[-0.0523, -0.0218]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06341176  0.14308512  0.02337845 -0.20360203]\n",
      "2= tensor([[-0.1970, -0.4486]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06055006 -0.05236322  0.01930641  0.09636302]\n",
      "2= tensor([[-0.0480, -0.0086]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06159732  0.14247678  0.02123367 -0.19016679]\n",
      "2= tensor([[-0.1927, -0.4341]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05874779 -0.05294241  0.01743033  0.10913814]\n",
      "2= tensor([[-0.0445,  0.0026]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05980663  0.14192548  0.01961309 -0.17799504]\n",
      "2= tensor([[-0.1887, -0.4209]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05696813 -0.05347157  0.01605319  0.12081005]\n",
      "2= tensor([[-0.0411,  0.0117]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05803756  0.14141676  0.0184694  -0.16676533]\n",
      "2= tensor([[-0.1850, -0.4089]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05520922 -0.05396464  0.01513409  0.13168646]\n",
      "2= tensor([[-0.0377,  0.0198]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05628851  0.14093728  0.01776782 -0.15618369]\n",
      "2= tensor([[-0.1815, -0.3976]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05346977 -0.05443449  0.01464414  0.14205118]\n",
      "2= tensor([[-0.0345,  0.0276]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05455846  0.1404747   0.01748517 -0.14597604]\n",
      "2= tensor([[-0.1782, -0.3867]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05174896 -0.05489323  0.01456565  0.15217143]\n",
      "2= tensor([[-0.0315,  0.0352]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05284683  0.14001717  0.01760907 -0.13588099]\n",
      "2= tensor([[-0.1748, -0.3759]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05004648 -0.05535252  0.01489145  0.16230491]\n",
      "2= tensor([[-0.0284,  0.0429]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05115354  0.13955311  0.01813755 -0.1256432 ]\n",
      "2= tensor([[-0.1713, -0.3650]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04836247 -0.05582392  0.01562469  0.17270629]\n",
      "2= tensor([[-0.0252,  0.0508]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04947895  0.13907096  0.01907882 -0.11500687]\n",
      "2= tensor([[-0.1677, -0.3537]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04669753 -0.05631909  0.01677868  0.1836337 ]\n",
      "2= tensor([[-0.0218,  0.0592]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04782391  0.13855882  0.02045135 -0.10370931]\n",
      "2= tensor([[-0.1638, -0.3416]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04505274  0.3333818   0.01837717 -0.3898704 ]\n",
      "2= tensor([[-0.3000, -0.7659]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0383851   0.1380039   0.01057976 -0.09145046]\n",
      "2= tensor([[-0.1613, -0.3313]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03562503 -0.05726808  0.00875075  0.20455152]\n",
      "2= tensor([[-0.0166,  0.0721]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03677038  0.13772765  0.01284178 -0.08535818]\n",
      "2= tensor([[-0.1590, -0.3250]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03401583 -0.05757601  0.01113462  0.21134852]\n",
      "2= tensor([[-0.0144,  0.0771]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03516736  0.13738498  0.01536159 -0.07780133]\n",
      "2= tensor([[-0.1561, -0.3167]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03241966  0.33228338  0.01380556 -0.36559832]\n",
      "2= tensor([[-0.2941, -0.7455]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02577399  0.13696799  0.00649359 -0.06859444]\n",
      "2= tensor([[-0.1546, -0.3100]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02303463 -0.05824645  0.0051217   0.22613016]\n",
      "2= tensor([[-0.0110,  0.0849]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02419955  0.13680193  0.00964431 -0.06493281]\n",
      "2= tensor([[-0.1530, -0.3063]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02146352 -0.05845696  0.00834565  0.2307773 ]\n",
      "2= tensor([[-0.0095,  0.0882]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02263266  0.13654475  0.0129612  -0.05926149]\n",
      "2= tensor([[-0.1507, -0.3002]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01990176 -0.05876062  0.01177597  0.23748243]\n",
      "2= tensor([[-0.0076,  0.0930]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02107697 -0.2540488   0.01652562  0.53385645]\n",
      "2= tensor([[0.0912, 0.3003]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02615795 -0.05916312  0.02720274  0.24642615]\n",
      "2= tensor([[-0.0041,  0.1024]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02734121  0.13555998  0.03213127 -0.0375538 ]\n",
      "2= tensor([[-0.1400, -0.2727]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02463001 -0.06000766  0.03138019  0.2650912 ]\n",
      "2= tensor([[0.0014, 0.1164]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02583016  0.13465267  0.03668202 -0.01753129]\n",
      "2= tensor([[-0.1326, -0.2507]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02313711 -0.06097561  0.03633139  0.28649583]\n",
      "2= tensor([[0.0076, 0.1321]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02435662  0.13360988  0.04206131  0.00548929]\n",
      "2= tensor([[-0.1243, -0.2263]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02168443 -0.06208926  0.04217109  0.31114075]\n",
      "2= tensor([[0.0148, 0.1498]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02292621  0.1324073   0.04839391  0.03204992]\n",
      "2= tensor([[-0.1146, -0.1981]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02027807 -0.06337404  0.0490349   0.33960035]\n",
      "2= tensor([[0.0235, 0.1687]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02154555  0.13101715  0.05582691  0.06277455]\n",
      "2= tensor([[-0.1033, -0.1655]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0189252   0.32529607  0.0570824  -0.21178526]\n",
      "2= tensor([[-0.2409, -0.5835]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01241928  0.12940641  0.0528467   0.09834378]\n",
      "2= tensor([[-0.0924, -0.1318]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00983115 -0.06643155  0.05481357  0.4072203 ]\n",
      "2= tensor([[0.0417, 0.2055]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01115979  0.12787206  0.06295798  0.13230976]\n",
      "2= tensor([[-0.0802, -0.0969]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00860234 -0.06809258  0.06560417  0.4441718 ]\n",
      "2= tensor([[0.0505, 0.2239]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0099642   0.12604277  0.07448761  0.17286897]\n",
      "2= tensor([[-0.0657, -0.0556]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00744334  0.32002398  0.07794499 -0.09541688]\n",
      "2= tensor([[-0.2015, -0.4623]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00104286  0.12387641  0.07603665  0.22080378]\n",
      "2= tensor([[-0.0496, -0.0156]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00143467  0.3178338   0.08045273 -0.04695843]\n",
      "2= tensor([[-0.1859, -0.4123]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00779134 0.1216559  0.07951356 0.2699842 ]\n",
      "2= tensor([[-0.0351,  0.0212]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01022446 0.31555843 0.08491325 0.0034017 ]\n",
      "2= tensor([[-0.1685, -0.3589]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01653563 0.11932784 0.08498128 0.3216216 ]\n",
      "2= tensor([[-0.0189,  0.0609]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.01892219 0.31314328 0.09141371 0.056902  ]\n",
      "2= tensor([[-0.1501, -0.3031]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02518505  0.5068437   0.09255175 -0.20559727]\n",
      "2= tensor([[-0.2819, -0.7042]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.03532193 0.3105285  0.08843981 0.11478663]\n",
      "2= tensor([[-0.1321, -0.2467]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0415325  0.11425796 0.09073554 0.43400922]\n",
      "2= tensor([[0.0146, 0.1403]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.04381766 0.30798602 0.09941572 0.17125219]\n",
      "2= tensor([[-0.1127, -0.1889]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04997738 0.11159209 0.10284077 0.4935686 ]\n",
      "2= tensor([[0.0300, 0.1780]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.05220922 0.3051247  0.11271214 0.23498541]\n",
      "2= tensor([[-0.0906, -0.1248]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.05831171 0.10858791 0.11741184 0.5609872 ]\n",
      "2= tensor([[0.0414, 0.2105]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06048347 0.30188334 0.12863159 0.30748013]\n",
      "2= tensor([[-0.0619, -0.0608]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06652114 0.49496016 0.1347812  0.05797106]\n",
      "2= tensor([[-0.1991, -0.4400]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07642034 0.29818898 0.13594061 0.38995677]\n",
      "2= tensor([[-0.0331,  0.0037]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08238412 0.49114606 0.14373975 0.14303495]\n",
      "2= tensor([[-0.1700, -0.3539]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.09220704 0.29428938 0.14660046 0.4773889 ]\n",
      "2= tensor([[-0.0048,  0.0686]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.09809283 0.48707035 0.15614823 0.23426558]\n",
      "2= tensor([[-0.1373, -0.2609]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.10783423 0.2901021  0.16083354 0.5718446 ]\n",
      "2= tensor([[0.0214, 0.1304]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.11363628 0.48264682 0.17227043 0.33383644]\n",
      "2= tensor([[-0.0960, -0.1628]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.12328921 0.2855453  0.17894717 0.67550987]\n",
      "2= tensor([[0.0386, 0.1775]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.12900013 0.4777889  0.19245736 0.44407934]\n",
      "2= tensor([[-0.0495, -0.0659]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.1385559  0.2805393  0.20133895 0.7907249 ]\n",
      "2= tensor([[0.0608, 0.2225]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04938978 -0.01421901  0.03619777  0.02611616]\n",
      "2= tensor([[-0.0907, -0.1445]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0491054  -0.20984086  0.03672009  0.32999656]\n",
      "2= tensor([[0.0457, 0.1953]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04490858 -0.01526035  0.04332002  0.04911581]\n",
      "2= tensor([[-0.0815, -0.1173]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04460337 -0.21097584  0.04430234  0.35514572]\n",
      "2= tensor([[0.0528, 0.2108]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04038386 -0.01651087  0.05140525  0.07675511]\n",
      "2= tensor([[-0.0711, -0.0861]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04005364  0.17783791  0.05294035 -0.19927646]\n",
      "2= tensor([[-0.2123, -0.5092]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0436104  -0.0179997   0.04895483  0.10962557]\n",
      "2= tensor([[-0.0610, -0.0534]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0432504   0.1763878   0.05114733 -0.16721939]\n",
      "2= tensor([[-0.2015, -0.4741]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04677816 -0.01942755  0.04780295  0.1411503 ]\n",
      "2= tensor([[-0.0513, -0.0238]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04638961  0.17497833  0.05062595 -0.13607669]\n",
      "2= tensor([[-0.1909, -0.4400]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04988918 -0.02083083  0.04790442  0.17213841]\n",
      "2= tensor([[-0.0412,  0.0032]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04947256  0.17357391  0.05134719 -0.10505567]\n",
      "2= tensor([[-0.1800, -0.4060]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.05294404 -0.02224484  0.04924608  0.20337477]\n",
      "2= tensor([[-0.0314,  0.0269]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05249914  0.17213951  0.05331357 -0.07337576]\n",
      "2= tensor([[-0.1682, -0.3709]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.05594193 -0.02370461  0.05184606  0.2356398 ]\n",
      "2= tensor([[-0.0207,  0.0521]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05546784  0.17063974  0.05655885 -0.04024911]\n",
      "2= tensor([[-0.1560, -0.3348]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.05888063 -0.02524573  0.05575387  0.2697287 ]\n",
      "2= tensor([[-0.0093,  0.0788]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.05837572  0.1690381   0.06114844 -0.00486106]\n",
      "2= tensor([[-0.1428, -0.2961]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.06175648 -0.02690508  0.06105122  0.30647084]\n",
      "2= tensor([[0.0035, 0.1073]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06121838 0.16729617 0.06718064 0.03364957]\n",
      "2= tensor([[-0.1283, -0.2539]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0645643  -0.02872165  0.06785363  0.34674928]\n",
      "2= tensor([[0.0163, 0.1369]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06398987 0.16537283 0.07478862 0.07621119]\n",
      "2= tensor([[-0.1130, -0.2088]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.06729732 -0.03073716  0.07631284  0.39152125]\n",
      "2= tensor([[0.0284, 0.1682]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06668258 -0.2268545   0.08414327  0.7072553 ]\n",
      "2= tensor([[0.1021, 0.3333]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06214549 -0.03299278  0.09828837  0.44220045]\n",
      "2= tensor([[0.0420, 0.1996]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.06148564 0.16061094 0.10713238 0.18204677]\n",
      "2= tensor([[-0.0743, -0.0942]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.06469785 -0.03586788  0.11077332  0.50651205]\n",
      "2= tensor([[0.0543, 0.2278]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.0639805  0.15753311 0.12090356 0.2506894 ]\n",
      "2= tensor([[-0.0493, -0.0301]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.06713116  0.35073972  0.12591735 -0.00154582]\n",
      "2= tensor([[-0.1804, -0.4090]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.07414596 0.15405793 0.12588643 0.32806307]\n",
      "2= tensor([[-0.0256,  0.0293]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.07722712 0.34718394 0.13244769 0.07757941]\n",
      "2= tensor([[-0.1538, -0.3271]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0841708  0.15043646 0.13399927 0.4089417 ]\n",
      "2= tensor([[0.0006, 0.0918]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.08717952 0.34342936 0.14217812 0.1613255 ]\n",
      "2= tensor([[-0.1253, -0.2402]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.09404811  0.5362599   0.14540462 -0.08334211]\n",
      "2= tensor([[-0.2556, -0.6248]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.10477331 0.33938533 0.14373778 0.25145194]\n",
      "2= tensor([[-0.0944, -0.1493]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.11156102 0.14253463 0.14876682 0.5857965 ]\n",
      "2= tensor([[0.0402, 0.1975]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.1144117  0.33529416 0.16048275 0.34342715]\n",
      "2= tensor([[-0.0574, -0.0664]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.12111759 0.1382964  0.16735129 0.6821064 ]\n",
      "2= tensor([[0.0562, 0.2381]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.12388352 0.33074775 0.18099342 0.4464343 ]\n",
      "2= tensor([[-0.0185,  0.0177]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.13049847 0.5229097  0.18992211 0.21582171]\n",
      "2= tensor([[-0.1517, -0.3175]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.14095667 0.325652   0.19423854 0.56188995]\n",
      "2= tensor([[0.0154, 0.0987]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [0.1474697  0.51759404 0.20547634 0.33613884]\n",
      "2= tensor([[-0.1035, -0.1955]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04519052 -0.04240563 -0.01119908  0.03315898]\n",
      "2= tensor([[-0.0746, -0.0834]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04603864 -0.2373652  -0.0105359   0.32228753]\n",
      "2= tensor([[0.0518, 0.2173]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05078594 -0.04209482 -0.00409015  0.02630072]\n",
      "2= tensor([[-0.0756, -0.0881]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05162783 -0.23715788 -0.00356413  0.31769037]\n",
      "2= tensor([[0.0513, 0.2168]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05637099 -0.04198534  0.00278967  0.02388556]\n",
      "2= tensor([[-0.0752, -0.0883]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0572107  -0.23714718  0.00326738  0.31744736]\n",
      "2= tensor([[0.0518, 0.2182]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06195364 -0.43231553  0.00961633  0.6111589 ]\n",
      "2= tensor([[0.1130, 0.3454]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07059995 -0.23732929  0.02183951  0.32152024]\n",
      "2= tensor([[0.0537, 0.2237]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07534654 -0.04252505  0.02826991  0.03580386]\n",
      "2= tensor([[-0.0672, -0.0678]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07619704 -0.23804075  0.02898599  0.33727047]\n",
      "2= tensor([[0.0575, 0.2322]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08095785 -0.04334302  0.0357314   0.05386725]\n",
      "2= tensor([[-0.0601, -0.0468]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08182471  0.15124886  0.03680874 -0.22733146]\n",
      "2= tensor([[-0.2035, -0.4716]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07879974 -0.04437926  0.03226212  0.07673129]\n",
      "2= tensor([[-0.0531, -0.0246]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07968732  0.1502657   0.03379674 -0.2056008 ]\n",
      "2= tensor([[-0.1968, -0.4488]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07668201 -0.04532285  0.02968473  0.09754883]\n",
      "2= tensor([[-0.0468, -0.0051]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07758847  0.14936136  0.0316357  -0.1856228 ]\n",
      "2= tensor([[-0.1902, -0.4269]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07460124  0.34401673  0.02792325 -0.4681604 ]\n",
      "2= tensor([[-0.3225, -0.8410]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0677209   0.14851163  0.01856004 -0.16680872]\n",
      "2= tensor([[-0.1856, -0.4092]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06475067 -0.04687101  0.01522386  0.1316711 ]\n",
      "2= tensor([[-0.0384,  0.0194]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06568809  0.1480296   0.01785729 -0.1561703 ]\n",
      "2= tensor([[-0.1821, -0.3980]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0627275  -0.04734341  0.01473388  0.14209227]\n",
      "2= tensor([[-0.0353,  0.0272]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06367437 -0.24267325  0.01757573  0.4393868 ]\n",
      "2= tensor([[0.0764, 0.2717]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06852783 -0.0478044   0.02636346  0.1522957 ]\n",
      "2= tensor([[-0.0309,  0.0380]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06948392 -0.24329373  0.02940938  0.45317775]\n",
      "2= tensor([[0.0792, 0.2786]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0743498  -0.43881896  0.03847293  0.75498384]\n",
      "2= tensor([[0.1153, 0.3811]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08312617 -0.24424788  0.05357261  0.4746515 ]\n",
      "2= tensor([[0.0829, 0.2878]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08801113 -0.04992178  0.06306564  0.19932334]\n",
      "2= tensor([[-0.0141,  0.0835]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08900957  0.14424413  0.0670521  -0.07281752]\n",
      "2= tensor([[-0.1458, -0.2946]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08612469 -0.05177183  0.06559575  0.24024425]\n",
      "2= tensor([[-0.0027,  0.1142]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08716013  0.14235474  0.07040064 -0.03104803]\n",
      "2= tensor([[-0.1307, -0.2482]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08431303 -0.05370248  0.06977968  0.28299   ]\n",
      "2= tensor([[0.0091, 0.1448]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08538707  0.14035839  0.07543948  0.01310569]\n",
      "2= tensor([[-0.1146, -0.1990]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08257991 -0.05575985  0.07570159  0.32860452]\n",
      "2= tensor([[0.0226, 0.1758]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08369511  0.13820736  0.08227368  0.060722  ]\n",
      "2= tensor([[-0.0975, -0.1471]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08093096 -0.05799194  0.08348812  0.37818667]\n",
      "2= tensor([[0.0363, 0.2044]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0820908   0.13585122  0.09105186  0.11295168]\n",
      "2= tensor([[-0.0789, -0.0921]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07937377 -0.06044945  0.09331089  0.43291524]\n",
      "2= tensor([[0.0496, 0.2320]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08058276  0.13323604  0.1019692   0.17104451]\n",
      "2= tensor([[-0.0587, -0.0337]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07791805  0.3267619   0.10539009 -0.08780939]\n",
      "2= tensor([[-0.1904, -0.4272]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07138281  0.13029952  0.1036339   0.23617643]\n",
      "2= tensor([[-0.0393,  0.0179]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06877682  0.32379994  0.10835743 -0.02210308]\n",
      "2= tensor([[-0.1696, -0.3607]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06230081  0.12730433  0.10791536  0.30270648]\n",
      "2= tensor([[-0.0188,  0.0697]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05975473  0.32073605  0.1139695   0.04591232]\n",
      "2= tensor([[-0.1467, -0.2895]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05334001  0.12417996  0.11488774  0.37226826]\n",
      "2= tensor([[0.0003, 0.1210]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05085641  0.31749833  0.12233311  0.11790508]\n",
      "2= tensor([[-0.1213, -0.2126]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04450644  0.1208553   0.12469121  0.44654152]\n",
      "2= tensor([[0.0201, 0.1713]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04208934  0.31401306  0.13362204  0.19561866]\n",
      "2= tensor([[-0.0945, -0.1317]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03580907  0.117258    0.13753441  0.5272885 ]\n",
      "2= tensor([[0.0357, 0.2134]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03346391 -0.0795038   0.14808019  0.8599519 ]\n",
      "2= tensor([[0.0949, 0.3456]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03505399  0.11332469  0.16527922  0.6172513 ]\n",
      "2= tensor([[0.0529, 0.2502]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03278749  0.30579916  0.17762424  0.38084516]\n",
      "2= tensor([[-0.0277,  0.0299]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02667151  0.49801287  0.18524115  0.14900832]\n",
      "2= tensor([[-0.1534, -0.3034]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01671126  0.3007882   0.18822132  0.4939341 ]\n",
      "2= tensor([[0.0066, 0.1131]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01069549  0.49282664  0.1981      0.2659748 ]\n",
      "2= tensor([[-0.1129, -0.1859]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00083896  0.2955102   0.20341949  0.6140221 ]\n",
      "2= tensor([[0.0306, 0.1767]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04601555  0.00813139 -0.03986895 -0.03125285]\n",
      "2= tensor([[-0.1110, -0.1798]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04585292 -0.1863968  -0.04049401  0.24858922]\n",
      "2= tensor([[0.0216, 0.1577]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04958085  0.00927935 -0.03552222 -0.05658639]\n",
      "2= tensor([[-0.1194, -0.2061]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04939527 -0.18531574 -0.03665395  0.22468077]\n",
      "2= tensor([[0.0151, 0.1431]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05310158  0.01031038 -0.03216033 -0.07933517]\n",
      "2= tensor([[-0.1272, -0.2308]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05289537 -0.18433614 -0.03374704  0.20303012]\n",
      "2= tensor([[0.0090, 0.1294]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0565821   0.01125178 -0.02968643 -0.10010446]\n",
      "2= tensor([[-0.1346, -0.2537]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05635706 -0.18343242 -0.03168852  0.18306664]\n",
      "2= tensor([[0.0034, 0.1167]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06002571  0.01212829 -0.02802719 -0.11944202]\n",
      "2= tensor([[-0.1414, -0.2749]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05978314  0.20764036 -0.03041603 -0.42083386]\n",
      "2= tensor([[-0.2866, -0.7221]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05563034  0.01296227 -0.03883271 -0.13789272]\n",
      "2= tensor([[-0.1494, -0.2977]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05537109 -0.18158258 -0.04159056  0.1422906 ]\n",
      "2= tensor([[-0.0087,  0.0867]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05900274  0.01410957 -0.03874475 -0.16321789]\n",
      "2= tensor([[-0.1580, -0.3251]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05872055 -0.18043692 -0.04200911  0.11699475]\n",
      "2= tensor([[-0.0156,  0.0684]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06232929  0.01526097 -0.03966921 -0.18864016]\n",
      "2= tensor([[-0.1667, -0.3525]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06202407 -0.17927165 -0.04344201  0.09126952]\n",
      "2= tensor([[-0.0225,  0.0496]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0656095   0.01644517 -0.04161663 -0.21479668]\n",
      "2= tensor([[-0.1757, -0.3807]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0652806  -0.17805786 -0.04591256  0.0644735 ]\n",
      "2= tensor([[-0.0307,  0.0288]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06884176  0.01769126 -0.04462309 -0.2423343 ]\n",
      "2= tensor([[-0.1853, -0.4105]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06848793 -0.17676581 -0.04946978  0.03594612]\n",
      "2= tensor([[-0.0395,  0.0044]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07202325  0.01902935 -0.04875086 -0.2719255 ]\n",
      "2= tensor([[-0.1957, -0.4430]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07164266 -0.17536429 -0.05418937  0.00499143]\n",
      "2= tensor([[-0.0498, -0.0246]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07514995 -0.3696689  -0.05408954  0.28009665]\n",
      "2= tensor([[0.0639, 0.2290]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08254332 -0.17381875 -0.0484876  -0.0291435 ]\n",
      "2= tensor([[-0.0599, -0.0558]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0860197   0.02196379 -0.04907047 -0.33672196]\n",
      "2= tensor([[-0.2168, -0.5134]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08558042 -0.17242675 -0.05580491 -0.05990804]\n",
      "2= tensor([[-0.0709, -0.0886]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08902896 -0.366706   -0.05700307  0.21465907]\n",
      "2= tensor([[0.0497, 0.2009]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09636308 -0.1708174  -0.05270989 -0.09544642]\n",
      "2= tensor([[-0.0815, -0.1224]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09977943 -0.36514583 -0.05461882  0.18015184]\n",
      "2= tensor([[0.0414, 0.1844]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10708234 -0.5594454  -0.05101578  0.4551166 ]\n",
      "2= tensor([[0.1120, 0.3222]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11827125 -0.3636406  -0.04191345  0.14679943]\n",
      "2= tensor([[0.0330, 0.1693]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12554406 -0.16794428 -0.03897746 -0.1588062 ]\n",
      "2= tensor([[-0.0991, -0.1814]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12890294 -0.36248714 -0.04215359  0.12132999]\n",
      "2= tensor([[0.0262, 0.1561]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.13615268 -0.1667874  -0.03972699 -0.18434834]\n",
      "2= tensor([[-0.1073, -0.2080]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.13948844 -0.36131907 -0.04341395  0.09554227]\n",
      "2= tensor([[0.0190, 0.1424]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.14671482 -0.16560265 -0.04150311 -0.21051545]\n",
      "2= tensor([[-0.1158, -0.2354]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.15002687 -0.36010736 -0.04571342  0.06879196]\n",
      "2= tensor([[0.0117, 0.1279]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.15722902 -0.16436085 -0.04433758 -0.23795614]\n",
      "2= tensor([[-0.1249, -0.2644]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.16051623 -0.35882226 -0.0490967   0.04041835]\n",
      "2= tensor([[0.0038, 0.1113]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.16769268 -0.1630319  -0.04828833 -0.2673419 ]\n",
      "2= tensor([[-0.1341, -0.2947]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.17095332 -0.35743263 -0.05363517  0.009728  ]\n",
      "2= tensor([[-0.0048,  0.0930]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.17810197 -0.16158414 -0.05344061 -0.29938346]\n",
      "2= tensor([[-0.1458, -0.3301]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.18133366 -0.35590523 -0.05942828 -0.02402201]\n",
      "2= tensor([[-0.0141,  0.0719]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.18845177 -0.1599836  -0.05990872 -0.33484727]\n",
      "2= tensor([[-0.1610, -0.3735]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.19165143 -0.35420403 -0.06660566 -0.06164191]\n",
      "2= tensor([[-0.0231,  0.0452]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.19873552 -0.15819345 -0.0678385  -0.37457344]\n",
      "2= tensor([[-0.1785, -0.4240]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.20189938 -0.3522895  -0.07532997 -0.10402825]\n",
      "2= tensor([[-0.0334,  0.0107]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.20894517 -0.15617336 -0.07741054 -0.41949427]\n",
      "2= tensor([[-0.1998, -0.4838]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.21206865 -0.35011798 -0.08580042 -0.15218455]\n",
      "2= tensor([[-0.0498, -0.0428]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.219071   -0.15387894 -0.08884411 -0.47065467]\n",
      "2= tensor([[-0.2241, -0.5525]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.22214858 -0.347641   -0.09825721 -0.20724371]\n",
      "2= tensor([[-0.0730, -0.1120]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.2291014  -0.5412306  -0.10240208  0.05289897]\n",
      "2= tensor([[0.0427, 0.1765]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.23992601 -0.3448008  -0.1013441  -0.2702559 ]\n",
      "2= tensor([[-0.0994, -0.1909]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.24682203 -0.5383415  -0.10674922 -0.01117858]\n",
      "2= tensor([[0.0239, 0.1386]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.25758886 -0.34186345 -0.10697279 -0.33554277]\n",
      "2= tensor([[-0.1267, -0.2729]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.2644261  -0.5353133  -0.11368365 -0.07841672]\n",
      "2= tensor([[0.0019, 0.0917]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.2751324  -0.33876073 -0.11525198 -0.4046935 ]\n",
      "2= tensor([[-0.1576, -0.3640]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.28190762 -0.5320757  -0.12334585 -0.15045388]\n",
      "2= tensor([[-0.0242,  0.0300]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.29254913 -0.3354232  -0.12635493 -0.47936332]\n",
      "2= tensor([[-0.1918, -0.4630]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.29925758 -0.13876514 -0.13594219 -0.8090483 ]\n",
      "2= tensor([[-0.3899, -1.0010]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.3020329  -0.33178854 -0.15212317 -0.56202847]\n",
      "2= tensor([[-0.2346, -0.5820]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.30866867 -0.52448523 -0.16336372 -0.32087332]\n",
      "2= tensor([[-0.0936, -0.1718]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.31915838 -0.71694964 -0.1697812  -0.08383612]\n",
      "2= tensor([[0.0249, 0.1223]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.33349735 -0.51985216 -0.17145792 -0.42490762]\n",
      "2= tensor([[-0.1408, -0.3090]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.3438944  -0.7121835  -0.17995608 -0.19080293]\n",
      "2= tensor([[-0.0193,  0.0329]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.35813808 -0.5150046  -0.18377213 -0.53441703]\n",
      "2= tensor([[-0.1935, -0.4594]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.36843815 -0.7071314  -0.19446047 -0.30480495]\n",
      "2= tensor([[-0.0679, -0.0884]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.3825808  -0.89902747 -0.20055658 -0.07919782]\n",
      "2= tensor([[0.0504, 0.1582]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.40056133 -0.70168006 -0.20214052 -0.4278546 ]\n",
      "2= tensor([[-0.1218, -0.2434]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00699923  0.00811477 -0.0439336   0.04386149]\n",
      "2= tensor([[-1.4162, -2.1363]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00716152 -0.18635055 -0.04305637  0.3223657 ]\n",
      "2= tensor([[-1.0894, -1.1904]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00343451 -0.38083377 -0.03660905  0.6011655 ]\n",
      "2= tensor([[-0.8969, -0.5937]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00418216 -0.18521935 -0.02458574  0.2971798 ]\n",
      "2= tensor([[-1.0998, -1.2270]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00788655 -0.37998235 -0.01864215  0.58200854]\n",
      "2= tensor([[-0.8992, -0.6042]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0154862  -0.18460423 -0.00700198  0.28351182]\n",
      "2= tensor([[-1.1027, -1.2403]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01917828 -0.37962562 -0.00133174  0.5739781 ]\n",
      "2= tensor([[-0.8999, -0.6061]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02677079 -0.18448502  0.01014782  0.28087598]\n",
      "2= tensor([[-1.0982, -1.2306]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0304605  -0.37975025  0.01576534  0.5767422 ]\n",
      "2= tensor([[-0.8984, -0.5984]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0380555  -0.18485278  0.02730019  0.2890671 ]\n",
      "2= tensor([[-1.0865, -1.1989]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04175255 -0.38035318  0.03308153  0.5902337 ]\n",
      "2= tensor([[-0.8951, -0.5821]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04935962 -0.18570966  0.0448862   0.30815235]\n",
      "2= tensor([[-1.0673, -1.1446]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05307381 -0.38144147  0.05104925  0.6146465 ]\n",
      "2= tensor([[-0.8902, -0.5568]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06070264 -0.18706861  0.06334218  0.33846894]\n",
      "2= tensor([[-1.0436, -1.0734]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06444401 -0.38303202  0.07011156  0.65043473]\n",
      "2= tensor([[-0.8842, -0.5221]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07210466 -0.18895306  0.08312025  0.38062742]\n",
      "2= tensor([[-1.0174, -0.9855]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07588372  0.00489627  0.0907328   0.11526655]\n",
      "2= tensor([[-1.2960, -1.8289]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07578579 -0.19140069  0.09303813  0.4351397 ]\n",
      "2= tensor([[-0.9920, -0.8947]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0796138   0.00228948  0.10174093  0.17317474]\n",
      "2= tensor([[-1.2491, -1.6881]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07956801 -0.19413032  0.10520442  0.4961411 ]\n",
      "2= tensor([[-0.9685, -0.8118]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08345062 -0.00063694  0.11512724  0.23837882]\n",
      "2= tensor([[-1.1995, -1.5342]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08346336 -0.19719927  0.11989482  0.5650432 ]\n",
      "2= tensor([[-0.9505, -0.7398]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08740734 -0.0039454   0.13119568  0.31240806]\n",
      "2= tensor([[-1.1439, -1.3618]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08748625 -0.20066857  0.13744384  0.6434179 ]\n",
      "2= tensor([[-0.9322, -0.6613]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09149963 -0.00770275  0.1503122   0.39698023]\n",
      "2= tensor([[-1.0944, -1.1917]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09165368 -0.20460199  0.1582518   0.73302436]\n",
      "2= tensor([[-0.9257, -0.5971]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09574572 -0.01197932  0.1729123   0.4940329 ]\n",
      "2= tensor([[-1.0477, -1.0170]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09598531  0.18033637  0.18279295  0.2604444 ]\n",
      "2= tensor([[-1.2902, -1.7807]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09237858 -0.01686029  0.18800184  0.60475373]\n",
      "2= tensor([[-1.0035, -0.8662]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09271578  0.17520432  0.20009692  0.3766807 ]\n",
      "2= tensor([[-1.2114, -1.5266]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08921169 -0.02211341  0.20763053  0.7251885 ]\n",
      "2= tensor([[-0.9741, -0.7594]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02555033 -0.03181644  0.02937931 -0.01890587]\n",
      "2= tensor([[-1.4449, -2.2399]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.024914   -0.22734714  0.02900119  0.2828999 ]\n",
      "2= tensor([[-1.0857, -1.2116]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02036705 -0.4228705   0.03465918  0.58458674]\n",
      "2= tensor([[-0.8925, -0.5824]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01190965 -0.22825074  0.04635092  0.3030202 ]\n",
      "2= tensor([[-1.0654, -1.1535]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00734463 -0.42400157  0.05241133  0.6099534 ]\n",
      "2= tensor([[-0.8875, -0.5556]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0011354  -0.22964992  0.06461039  0.3342281 ]\n",
      "2= tensor([[-1.0407, -1.0790]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0057284  -0.42562908  0.07129496  0.64656574]\n",
      "2= tensor([[-0.8801, -0.5190]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01424098 -0.23156914  0.08422627  0.37715825]\n",
      "2= tensor([[-1.0130, -0.9879]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01887236 -0.03773812  0.09176943  0.11217564]\n",
      "2= tensor([[-1.2931, -1.8323]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01962713 -0.23404704  0.09401295  0.43234232]\n",
      "2= tensor([[-0.9850, -0.8901]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02430807 -0.04037321  0.10265979  0.17071357]\n",
      "2= tensor([[-1.2425, -1.6865]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02511553 -0.23680328  0.10607406  0.4939364 ]\n",
      "2= tensor([[-0.9607, -0.8052]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0298516  -0.04332469  0.11595279  0.23647702]\n",
      "2= tensor([[-1.1915, -1.5290]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03071809 -0.23989588  0.12068233  0.5633676 ]\n",
      "2= tensor([[-0.9389, -0.7246]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03551601 -0.04665559  0.13194968  0.31100997]\n",
      "2= tensor([[-1.1348, -1.3528]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03644912 -0.2433864   0.13816988  0.64222175]\n",
      "2= tensor([[-0.9251, -0.6509]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04131685 -0.0504333   0.15101431  0.39604324]\n",
      "2= tensor([[-1.0858, -1.1821]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04232552 -0.24733913  0.15893519  0.7322702 ]\n",
      "2= tensor([[-0.9168, -0.5822]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0472723  -0.05472858  0.17358059  0.4935262 ]\n",
      "2= tensor([[-1.0385, -1.0049]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04836687  0.137575    0.18345112  0.26018235]\n",
      "2= tensor([[-1.2795, -1.7641]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04561537 -0.05962704  0.18865475  0.60465443]\n",
      "2= tensor([[-0.9917, -0.8485]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04680791  0.13242573  0.20074785  0.37682265]\n",
      "2= tensor([[-1.2001, -1.5083]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04415939 -0.06489681  0.2082843   0.7254867 ]\n",
      "2= tensor([[-0.9645, -0.7386]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02368209 -0.02746007  0.04655463  0.02210722]\n",
      "2= tensor([[-1.4064, -2.1387]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02313289 -0.22321768  0.04699678  0.3291076 ]\n",
      "2= tensor([[-1.0552, -1.1224]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01866853 -0.41897607  0.05357893  0.6362329 ]\n",
      "2= tensor([[-0.8833, -0.5418]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01028901 -0.22464067  0.06630359  0.36089283]\n",
      "2= tensor([[-1.0312, -1.0492]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0057962  -0.42063937  0.07352144  0.6737238 ]\n",
      "2= tensor([[-0.8754, -0.5050]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00261659 -0.22661209  0.08699592  0.405065  ]\n",
      "2= tensor([[-1.0043, -0.9578]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00714883 -0.42285308  0.09509722  0.7238579 ]\n",
      "2= tensor([[-0.8767, -0.4730]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01560589 -0.229166    0.10957438  0.46255642]\n",
      "2= tensor([[-0.9760, -0.8574]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02018921 -0.03574938  0.11882551  0.20632187]\n",
      "2= tensor([[-1.2202, -1.6196]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0209042  -0.23235238  0.12295195  0.53399944]\n",
      "2= tensor([[-0.9487, -0.7636]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02555125 -0.03915453  0.13363193  0.28244722]\n",
      "2= tensor([[-1.1620, -1.4390]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02633434 -0.2359043   0.13928087  0.61411166]\n",
      "2= tensor([[-0.9321, -0.6857]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03105242 -0.04297512  0.15156311  0.36833665]\n",
      "2= tensor([[-1.1060, -1.2537]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03191192 -0.23988913  0.15892984  0.7047108 ]\n",
      "2= tensor([[-0.9186, -0.6083]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03670971 -0.04728458  0.17302406  0.46597388]\n",
      "2= tensor([[-1.0577, -1.0743]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0376554  -0.24437481  0.18234354  0.80781066]\n",
      "2= tensor([[-0.9269, -0.5646]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0425429  -0.05215739  0.19849975  0.57757694]\n",
      "2= tensor([[-1.0031, -0.8891]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04281582  0.012769    0.00716604 -0.04449685]\n",
      "2= tensor([[-1.4747, -2.3070]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04256044 -0.18245497  0.0062761   0.2504384 ]\n",
      "2= tensor([[-1.1183, -1.2851]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04620954 -0.37766597  0.01128487  0.5450943 ]\n",
      "2= tensor([[-0.9052, -0.6225]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05376286 -0.1827044   0.02218675  0.25598824]\n",
      "2= tensor([[-1.1073, -1.2562]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05741695 -0.37813598  0.02730652  0.5555858 ]\n",
      "2= tensor([[-0.9012, -0.6059]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06497967 -0.18340786  0.03841824  0.27162963]\n",
      "2= tensor([[-1.0902, -1.2082]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06864782 -0.37905636  0.04385083  0.576178  ]\n",
      "2= tensor([[-0.8970, -0.5828]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07622895 -0.18457563  0.05537439  0.2976254 ]\n",
      "2= tensor([[-1.0664, -1.1395]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07992047 -0.38044143  0.06132689  0.6072455 ]\n",
      "2= tensor([[-0.8920, -0.5527]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08752929 -0.18622811  0.07347181  0.334492  ]\n",
      "2= tensor([[-1.0401, -1.0566]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09125386 -0.38231465  0.08016165  0.6494096 ]\n",
      "2= tensor([[-0.8849, -0.5129]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09890015 -0.18839546  0.09314984  0.38300714]\n",
      "2= tensor([[-1.0110, -0.9593]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10266806  0.00528901  0.10080998  0.12108644]\n",
      "2= tensor([[-1.2820, -1.7825]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10256228 -0.19112194  0.10323171  0.44379503]\n",
      "2= tensor([[-0.9837, -0.8615]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10638472  0.00239946  0.11210761  0.18535456]\n",
      "2= tensor([[-1.2306, -1.6279]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10633673 -0.19413312  0.1158147   0.51119345]\n",
      "2= tensor([[-0.9634, -0.7850]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11021939 -0.00081673  0.12603857  0.25713488]\n",
      "2= tensor([[-1.1762, -1.4591]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11023573 -0.19749166  0.13118127  0.58676445]\n",
      "2= tensor([[-0.9442, -0.7072]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11418556 -0.0044273   0.14291656  0.3381129 ]\n",
      "2= tensor([[-1.1199, -1.2801]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11427411 -0.20126303  0.14967881  0.6722309 ]\n",
      "2= tensor([[-0.9269, -0.6265]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11829937 -0.00850367  0.16312343  0.43016613]\n",
      "2= tensor([[-1.0717, -1.1064]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11846944 -0.20551425  0.17172675  0.7695049 ]\n",
      "2= tensor([[-0.9310, -0.5790]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12257972 -0.01311935  0.18711685  0.5353973 ]\n",
      "2= tensor([[-1.0238, -0.9319]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12284211 -0.2103113   0.19782479  0.880714  ]\n",
      "2= tensor([[-0.9469, -0.5495]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02808134 -0.04567786 -0.01756223  0.04014535]\n",
      "2= tensor([[-1.3910, -2.0767]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02716779 -0.24054362 -0.01675933  0.3272359 ]\n",
      "2= tensor([[-1.0591, -1.1156]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02235691 -0.43542302 -0.01021461  0.6145869 ]\n",
      "2= tensor([[-0.8842, -0.5494]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01364845 -0.24015984  0.00207713  0.3187044 ]\n",
      "2= tensor([[-1.0576, -1.1156]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00884526 -0.43531132  0.00845122  0.61204165]\n",
      "2= tensor([[-0.8840, -0.5456]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 1.3902952e-04 -2.4030848e-01  2.0692050e-02  3.2203248e-01]\n",
      "2= tensor([[-1.0495, -1.0940]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00466714 -0.4357189   0.0271327   0.6211684 ]\n",
      "2= tensor([[-0.8821, -0.5323]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01338152 -0.24098614  0.03955607  0.3371528 ]\n",
      "2= tensor([[-1.0353, -1.0512]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01820124 -0.436648    0.04629912  0.64204246]\n",
      "2= tensor([[-0.8781, -0.5091]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0269342  -0.24220099  0.05913997  0.36429155]\n",
      "2= tensor([[-1.0146, -0.9865]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03177822 -0.04796721  0.06642581  0.09082727]\n",
      "2= tensor([[-1.3033, -1.8522]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03273756 -0.24397528  0.06824235  0.4037058 ]\n",
      "2= tensor([[-0.9938, -0.9158]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03761707 -0.04988418  0.07631647  0.13329448]\n",
      "2= tensor([[-1.2649, -1.7422]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03861475 -0.24601163  0.07898235  0.44904464]\n",
      "2= tensor([[-0.9738, -0.8460]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04353499 -0.05209051  0.08796325  0.18226644]\n",
      "2= tensor([[-1.2233, -1.6202]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0445768  -0.24835381  0.09160858  0.50135106]\n",
      "2= tensor([[-0.9516, -0.7736]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04954387 -0.05463451  0.1016356   0.23888579]\n",
      "2= tensor([[-1.1774, -1.4816]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05063656 -0.25105044  0.10641331  0.5618188 ]\n",
      "2= tensor([[-0.9346, -0.7075]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05565757 -0.05757013  0.11764969  0.30446643]\n",
      "2= tensor([[-1.1273, -1.3258]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05680897 -0.254155    0.12373902  0.63181466]\n",
      "2= tensor([[-0.9214, -0.6405]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06189207 -0.06095689  0.13637531  0.3805197 ]\n",
      "2= tensor([[-1.0815, -1.1705]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06311122 -0.25772518  0.1439857   0.7129019 ]\n",
      "2= tensor([[-0.9129, -0.5764]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06826571 -0.06485918  0.15824375  0.46878228]\n",
      "2= tensor([[-1.0389, -1.0117]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0695629   0.12771489  0.16761939  0.22986005]\n",
      "2= tensor([[-1.2886, -1.7901]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0670086  -0.06935623  0.1722166   0.57037336]\n",
      "2= tensor([[-0.9951, -0.8636]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06839573  0.12298552  0.18362406  0.3365104 ]\n",
      "2= tensor([[-1.2122, -1.5499]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06593601 -0.07420983  0.19035426  0.6810133 ]\n",
      "2= tensor([[-0.9648, -0.7488]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06742021  0.1178302   0.20397453  0.45378318]\n",
      "2= tensor([[-1.1434, -1.3153]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00717171 -0.03425798 -0.01702549 -0.03195477]\n",
      "2= tensor([[-1.4570, -2.2564]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00648655 -0.2291317  -0.01766459  0.25530818]\n",
      "2= tensor([[-1.1087, -1.2606]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00190391 -0.42399704 -0.01255842  0.54236746]\n",
      "2= tensor([[-0.9004, -0.6118]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00657603 -0.22870086 -0.00171107  0.24575421]\n",
      "2= tensor([[-1.1092, -1.2646]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01115004 -0.42379832  0.00320401  0.53789693]\n",
      "2= tensor([[-0.8997, -0.6078]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01962601 -0.22872156  0.01396195  0.24622528]\n",
      "2= tensor([[-1.1018, -1.2455]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02420044 -0.4240401   0.01888645  0.54327923]\n",
      "2= tensor([[-0.8985, -0.5972]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03268124 -0.2291886   0.02975204  0.25660637]\n",
      "2= tensor([[-1.0876, -1.2060]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03726501 -0.42472243  0.03488417  0.5585231 ]\n",
      "2= tensor([[-0.8951, -0.5780]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04575946 -0.23010705  0.04605463  0.27703154]\n",
      "2= tensor([[-1.0678, -1.1477]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0503616  -0.03567138  0.05159526 -0.00077747]\n",
      "2= tensor([[-1.3906, -2.0857]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05107503 -0.23149386  0.05157971  0.30772763]\n",
      "2= tensor([[-1.0465, -1.0814]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05570491 -0.42731136  0.05773426  0.616221  ]\n",
      "2= tensor([[-0.8837, -0.5216]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06425114 -0.23304152  0.07005868  0.3422662 ]\n",
      "2= tensor([[-1.0212, -1.0028]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06891197 -0.03898262  0.07690401  0.07247231]\n",
      "2= tensor([[-1.3091, -1.8653]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06969162 -0.23511803  0.07835345  0.38839337]\n",
      "2= tensor([[-0.9966, -0.9205]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07439398 -0.04119061  0.08612132  0.12140706]\n",
      "2= tensor([[-1.2656, -1.7387]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07521779 -0.2374341   0.08854946  0.43996972]\n",
      "2= tensor([[-0.9736, -0.8385]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07996648 -0.04366963  0.09734885  0.17646126]\n",
      "2= tensor([[-1.2195, -1.6023]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08083986 -0.24004021  0.10087808  0.4981979 ]\n",
      "2= tensor([[-0.9523, -0.7665]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08564067 -0.04647446  0.11084204  0.23893325]\n",
      "2= tensor([[-1.1693, -1.4507]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08657016 -0.24299096  0.1156207   0.5644199 ]\n",
      "2= tensor([[-0.9351, -0.6968]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09142998 -0.04966484  0.1269091   0.31028372]\n",
      "2= tensor([[-1.1171, -1.2875]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09242328 -0.24634495  0.13311477  0.6401425 ]\n",
      "2= tensor([[-0.9205, -0.6247]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09735017 -0.05330534  0.14591762  0.39216498]\n",
      "2= tensor([[-1.0710, -1.1275]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09841628 -0.25016403  0.15376092  0.7270627 ]\n",
      "2= tensor([[-0.9161, -0.5630]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10341956 -0.0574644   0.16830218  0.4864512 ]\n",
      "2= tensor([[-1.0257, -0.9586]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10456885  0.13493283  0.1780312   0.25118062]\n",
      "2= tensor([[-1.2641, -1.7104]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10187019 -0.06222541  0.18305482  0.59430873]\n",
      "2= tensor([[-0.9882, -0.8275]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1031147   0.12992635  0.19494098  0.3644148 ]\n",
      "2= tensor([[-1.1879, -1.4636]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10051618 -0.0673543   0.20222929  0.7116811 ]\n",
      "2= tensor([[-0.9612, -0.7218]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04161325 -0.00840268  0.01603106 -0.04938551]\n",
      "2= tensor([[-1.4976, -2.3842]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0414452  -0.20375079  0.01504335  0.24831192]\n",
      "2= tensor([[-1.1313, -1.3440]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03737018 -0.39908433  0.02000959  0.5457016 ]\n",
      "2= tensor([[-0.9088, -0.6466]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0293885  -0.20424914  0.03092362  0.25938982]\n",
      "2= tensor([[-1.1159, -1.3015]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02530351 -0.3997986   0.03611141  0.56166387]\n",
      "2= tensor([[-0.9014, -0.6207]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01730754 -0.5954082   0.04734469  0.86550146]\n",
      "2= tensor([[-0.8721, -0.3543]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00539938 -0.40096152  0.06465472  0.58807236]\n",
      "2= tensor([[-0.8956, -0.5895]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00261985 -0.20680174  0.07641617  0.31643647]\n",
      "2= tensor([[-1.0587, -1.1384]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00675589 -0.40292427  0.0827449   0.6322062 ]\n",
      "2= tensor([[-0.8866, -0.5468]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01481437 -0.20904827  0.09538902  0.36668646]\n",
      "2= tensor([[-1.0261, -1.0338]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01899534 -0.40538713  0.10272275  0.68785775]\n",
      "2= tensor([[-0.8792, -0.4985]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02710308 -0.21182962  0.11647991  0.42919937]\n",
      "2= tensor([[-0.9934, -0.9135]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03133968 -0.40839186  0.1250639   0.75621253]\n",
      "2= tensor([[-0.8879, -0.4661]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03950751 -0.21519522  0.14018814  0.505354  ]\n",
      "2= tensor([[-0.9605, -0.7989]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04381141 -0.0222983   0.15029523  0.2599276 ]\n",
      "2= tensor([[-1.1805, -1.4936]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04425738 -0.2192105   0.15549378  0.59598684]\n",
      "2= tensor([[-0.9390, -0.7079]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04864159 -0.02656719  0.16741352  0.35603935]\n",
      "2= tensor([[-1.1165, -1.2841]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04917293 -0.22362453  0.1745343   0.6964827 ]\n",
      "2= tensor([[-0.9246, -0.6216]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05364542 -0.03129729  0.18846396  0.46342775]\n",
      "2= tensor([[-1.0625, -1.0856]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05427137 -0.22851278  0.19773251  0.8090939 ]\n",
      "2= tensor([[-0.9335, -0.5754]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00632099 -0.03273036  0.03026335  0.04434704]\n",
      "2= tensor([[-1.3779, -2.0525]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00566638 -0.22827291  0.03115029  0.3464226 ]\n",
      "2= tensor([[-1.0415, -1.0707]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00110092 -0.42382377  0.03807874  0.64876336]\n",
      "2= tensor([[-0.8787, -0.5204]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00737555 -0.22925241  0.05105401  0.3683103 ]\n",
      "2= tensor([[-1.0232, -1.0155]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0119606  -0.03489166  0.05842021  0.09215239]\n",
      "2= tensor([[-1.3206, -1.8999]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01265843 -0.2308002   0.06026326  0.40267965]\n",
      "2= tensor([[-1.0040, -0.9493]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01727444 -0.03658243  0.06831685  0.12958851]\n",
      "2= tensor([[-1.2839, -1.7992]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01800609 -0.23261315  0.07090863  0.4430182 ]\n",
      "2= tensor([[-0.9858, -0.8844]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02265835 -0.03856242  0.07976899  0.17350326]\n",
      "2= tensor([[-1.2464, -1.6895]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0234296  -0.23473005  0.08323906  0.49024624]\n",
      "2= tensor([[-0.9650, -0.8176]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0281242  -0.04087492  0.09304398  0.22491437]\n",
      "2= tensor([[-1.2040, -1.5632]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0289417  -0.23719499  0.09754227  0.5454362 ]\n",
      "2= tensor([[-0.9440, -0.7453]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0336856  -0.43354246  0.10845099  0.86718935]\n",
      "2= tensor([[-0.8968, -0.4261]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04235645 -0.24005014  0.12579478  0.61047816]\n",
      "2= tensor([[-0.9294, -0.6770]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04715745 -0.04689015  0.13800435  0.35991386]\n",
      "2= tensor([[-1.1037, -1.2450]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04809525 -0.24367638  0.14520262  0.6927314 ]\n",
      "2= tensor([[-0.9173, -0.6063]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05296878 -0.05083537  0.15905724  0.44905362]\n",
      "2= tensor([[-1.0588, -1.0794]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05398549 -0.24780743  0.16803832  0.78734803]\n",
      "2= tensor([[-0.9223, -0.5602]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05894164 -0.05534306  0.18378527  0.55188894]\n",
      "2= tensor([[-1.0080, -0.9057]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0600485   0.13678688  0.19482306  0.32227674]\n",
      "2= tensor([[-1.2323, -1.6137]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05731276 -0.06049833  0.2012686   0.6695225 ]\n",
      "2= tensor([[-0.9732, -0.7764]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01289518 -0.03607798  0.02664627  0.0127448 ]\n",
      "2= tensor([[-1.4083, -2.1360]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01217362 -0.23157173  0.02690116  0.3137144 ]\n",
      "2= tensor([[-1.0604, -1.1315]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00754219 -0.42706636  0.03317545  0.61475825]\n",
      "2= tensor([[-0.8853, -0.5489]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00099914 -0.23242329  0.04547061  0.3327061 ]\n",
      "2= tensor([[-1.0433, -1.0809]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0056476  -0.42816195  0.05212474  0.6393744 ]\n",
      "2= tensor([[-0.8805, -0.5227]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01421084 -0.23380403  0.06491222  0.36355117]\n",
      "2= tensor([[-1.0204, -1.0097]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01888692 -0.03966181  0.07218325  0.09202194]\n",
      "2= tensor([[-1.3122, -1.8802]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01968016 -0.23574015  0.07402369  0.40657702]\n",
      "2= tensor([[-0.9974, -0.9297]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02439496 -0.04174165  0.08215523  0.13811925]\n",
      "2= tensor([[-1.2696, -1.7603]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0252298  -0.23793833  0.08491761  0.45554814]\n",
      "2= tensor([[-0.9755, -0.8543]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02998856 -0.04411323  0.09402858  0.19079389]\n",
      "2= tensor([[-1.2252, -1.6301]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03087083 -0.24044578  0.09784445  0.5115955 ]\n",
      "2= tensor([[-0.9528, -0.7775]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03567974 -0.04682837  0.10807636  0.25127885]\n",
      "2= tensor([[-1.1779, -1.4843]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03661631 -0.24331434  0.11310194  0.5760008 ]\n",
      "2= tensor([[-0.9345, -0.7071]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0414826  -0.04994433  0.12462196  0.32098013]\n",
      "2= tensor([[-1.1256, -1.3213]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04248148 -0.24660027  0.13104156  0.65022045]\n",
      "2= tensor([[-0.9222, -0.6383]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04741349 -0.05352353  0.14404596  0.40150446]\n",
      "2= tensor([[-1.0800, -1.1612]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04848396 -0.25036347  0.15207605  0.7359097 ]\n",
      "2= tensor([[-0.9151, -0.5745]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05349123 -0.05763265  0.16679426  0.4946882 ]\n",
      "2= tensor([[-1.0350, -0.9928]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05464388  0.1347929   0.17668802  0.25886604]\n",
      "2= tensor([[-1.2763, -1.7543]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05194803 -0.06235345  0.18186533  0.601658  ]\n",
      "2= tensor([[-0.9908, -0.8456]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05319509  0.12982132  0.1938985   0.371324  ]\n",
      "2= tensor([[-1.1998, -1.5073]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05059867 -0.0674504   0.20132497  0.71833605]\n",
      "2= tensor([[-0.9634, -0.7368]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00510429 -0.02000676  0.00496036  0.02755735]\n",
      "2= tensor([[-3.7601, -6.2652]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00470416  0.1750437   0.00551151 -0.26355642]\n",
      "2= tensor([[-4.8646, -8.6623]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00820503 -0.02015648  0.00024038  0.03085979]\n",
      "2= tensor([[-3.7590, -6.2616]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0078019  -0.21528187  0.00085757  0.32361856]\n",
      "2= tensor([[-2.9202, -4.3814]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00349626 -0.41041604  0.00732994  0.6165718 ]\n",
      "2= tensor([[-2.5031, -3.3716]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00471206 -0.60563964  0.01966138  0.9115543 ]\n",
      "2= tensor([[-2.4805, -3.1235]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01682485 -0.801022    0.03789246  1.2103513 ]\n",
      "2= tensor([[-2.6681, -3.2715]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03284529 -0.9966122   0.06209949  1.5146637 ]\n",
      "2= tensor([[-2.9089, -3.5087]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05277753 -1.1924284   0.09239276  1.8260673 ]\n",
      "2= tensor([[-3.1831, -3.8063]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0766261  -1.3884456   0.12891412  2.145964  ]\n",
      "2= tensor([[-3.4655, -4.1197]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10439502 -1.5845811   0.1718334   2.4755218 ]\n",
      "2= tensor([[-3.7675, -4.4598]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02975614 -0.03720639  0.01027982 -0.01010569]\n",
      "2= tensor([[-3.8352, -6.4405]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02901202 -0.23247425  0.0100777   0.28580284]\n",
      "2= tensor([[-2.9642, -4.4974]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02436253 -0.42773846  0.01579376  0.5816471 ]\n",
      "2= tensor([[-2.5073, -3.3986]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01580776 -0.6230781   0.0274267   0.87926316]\n",
      "2= tensor([[-2.4616, -3.0995]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0033462  -0.81856173  0.04501196  1.1804408 ]\n",
      "2= tensor([[-2.6505, -3.2501]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01302504 -1.0142382   0.06862078  1.4868872 ]\n",
      "2= tensor([[-2.8920, -3.4872]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0333098  -1.2101259   0.09835853  1.8001859 ]\n",
      "2= tensor([[-3.1673, -3.7852]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05751232 -1.4062005   0.13436225  2.1217473 ]\n",
      "2= tensor([[-3.4506, -4.0996]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08563633 -1.6023804   0.17679718  2.4527485 ]\n",
      "2= tensor([[-3.7574, -4.4454]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.0074253  0.01672071 0.02478347 0.03171742]\n",
      "2= tensor([[-3.8107, -6.3754]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00775972 -0.17874771  0.02541781  0.33211562]\n",
      "2= tensor([[-2.9568, -4.4556]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.00418476 0.01600339 0.03206013 0.04755534]\n",
      "2= tensor([[-3.7708, -6.2846]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00450483 -0.17956325  0.03301124  0.35017863]\n",
      "2= tensor([[-2.9295, -4.3887]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00091356 -0.37513876  0.04001481  0.6530856 ]\n",
      "2= tensor([[-2.5249, -3.4034]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00658921 -0.5707944   0.05307652  0.9580954 ]\n",
      "2= tensor([[-2.5296, -3.2099]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0180051  -0.37642473  0.07223842  0.6825486 ]\n",
      "2= tensor([[-2.5184, -3.3698]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02553359 -0.57247156  0.0858894   0.9970715 ]\n",
      "2= tensor([[-2.5662, -3.2509]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03698302 -0.76863045  0.10583083  1.3154457 ]\n",
      "2= tensor([[-2.7714, -3.4252]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05235563 -0.9649202   0.13213974  1.6392893 ]\n",
      "2= tensor([[-3.0438, -3.7202]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07165404 -1.1613204   0.16492553  1.9700574 ]\n",
      "2= tensor([[-3.3318, -4.0424]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09488045 -1.3577559   0.20432667  2.308981  ]\n",
      "2= tensor([[-3.6358, -4.3877]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00474454  0.01664718  0.03323909  0.02021623]\n",
      "2= tensor([[-3.8158, -6.3889]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0044116  -0.1789353   0.03364341  0.3231984 ]\n",
      "2= tensor([[-2.9564, -4.4554]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00799031 -0.37451977  0.04010738  0.62629837]\n",
      "2= tensor([[-2.5275, -3.4204]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0154807  -0.5701779   0.05263335  0.931338  ]\n",
      "2= tensor([[-2.5180, -3.1944]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02688426 -0.76596916  0.07126011  1.2400852 ]\n",
      "2= tensor([[-2.7023, -3.3330]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04220364 -0.9619301   0.09606181  1.5542134 ]\n",
      "2= tensor([[-2.9568, -3.5922]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06144224 -1.1580632   0.12714608  1.8752555 ]\n",
      "2= tensor([[-3.2375, -3.9044]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08460351 -1.3543231   0.16465119  2.204549  ]\n",
      "2= tensor([[-3.5274, -4.2283]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11168997 -1.5506009   0.20874217  2.543173  ]\n",
      "2= tensor([[-3.8379, -4.5829]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00241061 -0.00407178 -0.04918326 -0.00254163]\n",
      "2= tensor([[-3.8842, -6.5276]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00232918 -0.19845513 -0.0492341   0.27422675]\n",
      "2= tensor([[-3.0320, -4.6301]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00163993 -0.39284128 -0.04374956  0.5509837 ]\n",
      "2= tensor([[-2.5424, -3.4804]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00949675 -0.58732235 -0.03272989  0.82956785]\n",
      "2= tensor([[-2.4315, -3.0726]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0212432  -0.78198195 -0.01613853  1.11178   ]\n",
      "2= tensor([[-2.5748, -3.1471]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03688284 -0.97688824  0.00609707  1.3993568 ]\n",
      "2= tensor([[-2.7947, -3.3524]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0564206  -1.1720854   0.03408421  1.6939398 ]\n",
      "2= tensor([[-3.0483, -3.6121]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07986231 -0.97737306  0.067963    1.4120597 ]\n",
      "2= tensor([[-2.8414, -3.4174]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09940977 -1.1732686   0.0962042   1.7251902 ]\n",
      "2= tensor([[-3.1161, -3.7096]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12287515 -1.3693504   0.13070801  2.0461934 ]\n",
      "2= tensor([[-3.3980, -4.0217]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.15026215 -1.5655494   0.17163187  2.3763003 ]\n",
      "2= tensor([[-3.6993, -4.3606]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01354024 0.04828739 0.03832537 0.04449205]\n",
      "2= tensor([[-3.8478, -6.4483]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01450599  0.24283941  0.03921521 -0.23585679]\n",
      "2= tensor([[-4.9031, -8.7351]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.01936278 0.04717977 0.03449807 0.06893336]\n",
      "2= tensor([[-3.8042, -6.3481]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02030637 -0.14841937  0.03587674  0.3722979 ]\n",
      "2= tensor([[-2.9581, -4.4431]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01733798 -0.34403214  0.0433227   0.67607373]\n",
      "2= tensor([[-2.5502, -3.4499]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01045734 -0.53972846  0.05684417  0.9820757 ]\n",
      "2= tensor([[-2.5563, -3.2703]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-3.3722792e-04 -7.3556417e-01  7.6485686e-02  1.2920580e+00]\n",
      "2= tensor([[-2.7363, -3.3960]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01504851 -0.9315706   0.10232685  1.6076729 ]\n",
      "2= tensor([[-2.9920, -3.6637]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03367992 -1.1277424   0.1344803   1.9304231 ]\n",
      "2= tensor([[-3.2748, -3.9787]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05623477 -1.3240242   0.17308877  2.2616057 ]\n",
      "2= tensor([[-3.5717, -4.3140]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00352451  0.01009153 -0.04975632 -0.04635743]\n",
      "2= tensor([[-4.0145, -6.8145]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00372634 -0.18428294 -0.05068346  0.23022112]\n",
      "2= tensor([[-3.1299, -4.8536]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 4.0684445e-05 -3.7864539e-01 -4.6079043e-02  5.0649583e-01]\n",
      "2= tensor([[-2.5863, -3.5869]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00753222 -0.18290545 -0.03594913  0.19965515]\n",
      "2= tensor([[-3.1672, -4.9406]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01119033 -0.3774953  -0.03195602  0.48078454]\n",
      "2= tensor([[-2.5964, -3.6148]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01874024 -0.5721519  -0.02234033  0.7632269 ]\n",
      "2= tensor([[-2.4224, -3.0842]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03018328 -0.76695913 -0.00707579  1.0487974 ]\n",
      "2= tensor([[-2.5359, -3.1043]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04552246 -0.96198654  0.01390015  1.3392508 ]\n",
      "2= tensor([[-2.7577, -3.3110]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06476219 -1.1572807   0.04068517  1.6362504 ]\n",
      "2= tensor([[-3.0092, -3.5673]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08790781 -1.3528556   0.07341018  1.941328  ]\n",
      "2= tensor([[-3.2794, -3.8563]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11496492 -1.5486798   0.11223674  2.2558365 ]\n",
      "2= tensor([[-3.5660, -4.1748]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14593852 -1.7446619   0.15735346  2.5808885 ]\n",
      "2= tensor([[-3.8779, -4.5257]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.18083175 -1.940633    0.20897123  2.9172845 ]\n",
      "2= tensor([[-4.2043, -4.8943]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0274218  -0.02599783 -0.00674902 -0.00240896]\n",
      "2= tensor([[-3.8451, -6.4562]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02690184 -0.22102234 -0.0067972   0.28813696]\n",
      "2= tensor([[-2.9819, -4.5316]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0224814  -0.4160467  -0.00103446  0.57866836]\n",
      "2= tensor([[-2.5131, -3.4154]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01416046 -0.61115414  0.0105389   0.87102526]\n",
      "2= tensor([[-2.4550, -3.0956]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00193738 -0.8064178   0.02795941  1.1670029 ]\n",
      "2= tensor([[-2.6327, -3.2277]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01419098 -1.0018922   0.05129946  1.4683189 ]\n",
      "2= tensor([[-2.8661, -3.4521]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03422882 -1.1976031   0.08066584  1.7765744 ]\n",
      "2= tensor([[-3.1378, -3.7435]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05818088 -1.3935357   0.11619733  2.0932076 ]\n",
      "2= tensor([[-3.4172, -4.0524]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0860516  -1.5896207   0.15806149  2.419437  ]\n",
      "2= tensor([[-3.7179, -4.3905]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11784401 -1.7857175   0.20645022  2.7561922 ]\n",
      "2= tensor([[-4.0444, -4.7600]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00724027 -0.03913643 -0.04151165 -0.01019387]\n",
      "2= tensor([[-3.8228, -6.3981]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.008023   -0.23363921 -0.04171553  0.26910806]\n",
      "2= tensor([[-2.9793, -4.5137]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01269579 -0.4281418  -0.03633337  0.5483473 ]\n",
      "2= tensor([[-2.5080, -3.4018]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02125862 -0.622735   -0.02536642  0.8293648 ]\n",
      "2= tensor([[-2.4210, -3.0321]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03371332 -0.8175012  -0.00877913  1.1139631 ]\n",
      "2= tensor([[-2.5835, -3.1434]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05006335 -1.0125067   0.01350014  1.4038792 ]\n",
      "2= tensor([[-2.8050, -3.3504]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07031348 -1.2077937   0.04157772  1.7007519 ]\n",
      "2= tensor([[-3.0639, -3.6184]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09446935 -1.4033693   0.07559276  2.006082  ]\n",
      "2= tensor([[-3.3349, -3.9107]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12253674 -1.599193    0.1157144   2.3211818 ]\n",
      "2= tensor([[-3.6277, -4.2374]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1545206  -1.7951616   0.16213803  2.647113  ]\n",
      "2= tensor([[-3.9417, -4.5903]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04474044 0.01684372 0.01075624 0.0109278 ]\n",
      "2= tensor([[-3.9077, -6.5911]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04507731 -0.17843083  0.0109748   0.30698496]\n",
      "2= tensor([[-3.0284, -4.6280]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04150869 -0.37370744  0.01711449  0.60310876]\n",
      "2= tensor([[-2.5458, -3.4819]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03403455 -0.5690645   0.02917667  0.9011329 ]\n",
      "2= tensor([[-2.4916, -3.1782]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02265326 -0.7645694   0.04719933  1.2028421 ]\n",
      "2= tensor([[-2.6611, -3.2889]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00736187 -0.96026874  0.07125617  1.5099357 ]\n",
      "2= tensor([[-2.9015, -3.5246]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01184351 -1.1561781   0.10145488  1.8239856 ]\n",
      "2= tensor([[-3.1771, -3.8282]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03496707 -0.962318    0.1379346   1.5644673 ]\n",
      "2= tensor([[-2.9896, -3.6533]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05421343 -1.1587931   0.16922393  1.896805  ]\n",
      "2= tensor([[-3.2783, -3.9766]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07738929 -1.3552969   0.20716004  2.236865  ]\n",
      "2= tensor([[-3.5793, -4.3167]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01896788 -0.00337314 -0.03028792  0.01845415]\n",
      "2= tensor([[-3.8440, -6.4426]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01890042 -0.19804794 -0.02991883  0.30142912]\n",
      "2= tensor([[-2.9970, -4.5537]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01493946 -0.39273095 -0.02389025  0.58452815]\n",
      "2= tensor([[-2.5259, -3.4420]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00708484 -0.5875102  -0.01219969  0.86959064]\n",
      "2= tensor([[-2.4534, -3.1019]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00466536 -0.78246415  0.00519212  1.158413  ]\n",
      "2= tensor([[-2.6152, -3.2071]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02031465 -0.9776534   0.02836039  1.4527194 ]\n",
      "2= tensor([[-2.8396, -3.4184]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03986771 -1.1731119   0.05741477  1.7541263 ]\n",
      "2= tensor([[-3.1050, -3.6988]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06332995 -1.368836    0.0924973   2.0640993 ]\n",
      "2= tensor([[-3.3792, -4.0006]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09070668 -1.5647708   0.13377929  2.3839004 ]\n",
      "2= tensor([[-3.6707, -4.3266]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12200209 -1.7607938   0.1814573   2.7145216 ]\n",
      "2= tensor([[-3.9900, -4.6861]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0169486  -0.03376559 -0.015682   -0.0176072 ]\n",
      "2= tensor([[-3.8200, -6.3968]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01762391 -0.22865917 -0.01603414  0.2700869 ]\n",
      "2= tensor([[-2.9667, -4.4866]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0221971  -0.4235487  -0.0106324   0.55766976]\n",
      "2= tensor([[-2.5033, -3.3876]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-3.0668072e-02 -6.1851978e-01  5.2099297e-04  8.4698403e-01]\n",
      "2= tensor([[-2.4422, -3.0588]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04303847 -0.8136488   0.01746067  1.1398307 ]\n",
      "2= tensor([[-2.6141, -3.1874]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05931145 -1.0089947   0.04025729  1.437938  ]\n",
      "2= tensor([[-2.8437, -3.4059]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07949134 -1.204589    0.06901605  1.7429242 ]\n",
      "2= tensor([[-3.1132, -3.6896]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10358312 -1.4004251   0.10387453  2.0562537 ]\n",
      "2= tensor([[-3.3898, -3.9943]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.13159162 -1.5964441   0.14499961  2.3791816 ]\n",
      "2= tensor([[-3.6885, -4.3294]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1635205  -1.7925191   0.19258323  2.7126882 ]\n",
      "2= tensor([[-4.0089, -4.6909]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00317097  0.0478257  -0.03294344  0.01933123]\n",
      "2= tensor([[-3.9098, -6.5781]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00221446 -0.1468087  -0.03255682  0.3014408 ]\n",
      "2= tensor([[-3.0546, -4.6705]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00515063 -0.34145185 -0.026528    0.5836808 ]\n",
      "2= tensor([[-2.5671, -3.5217]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01197967 -0.53619236 -0.01485439  0.8678904 ]\n",
      "2= tensor([[-2.4724, -3.1511]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02270352 -0.731109    0.00250342  1.1558663 ]\n",
      "2= tensor([[-2.6101, -3.2148]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0373257  -0.5360198   0.02562075  0.8639693 ]\n",
      "2= tensor([[-2.4904, -3.1720]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04804609 -0.731481    0.04290013  1.1645966 ]\n",
      "2= tensor([[-2.6429, -3.2610]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06267571 -0.536943    0.06619206  0.8856667 ]\n",
      "2= tensor([[-2.5191, -3.2042]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07341457 -0.7328981   0.0839054   1.198402  ]\n",
      "2= tensor([[-2.6915, -3.3267]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08807254 -0.92899954  0.10787344  1.5161586 ]\n",
      "2= tensor([[-2.9387, -3.5717]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10665253 -1.1252487   0.13819662  1.8404745 ]\n",
      "2= tensor([[-3.2214, -3.8860]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1291575 -1.3215995  0.1750061  2.1726935]\n",
      "2= tensor([[-3.5129, -4.2121]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00374298  0.02467415 -0.01536449 -0.02551565]\n",
      "2= tensor([[-3.9681, -6.7167]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00423647 -0.17022413 -0.0158748   0.2622803 ]\n",
      "2= tensor([[-3.0779, -4.7389]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00083199 -0.3651159  -0.01062919  0.5499141 ]\n",
      "2= tensor([[-2.5627, -3.5297]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-6.4703333e-03 -5.6008697e-01  3.6908788e-04  8.3922929e-01]\n",
      "2= tensor([[-2.4578, -3.1250]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01767207 -0.755214    0.01715367  1.1320282 ]\n",
      "2= tensor([[-2.6021, -3.2007]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03277635 -0.9505562   0.03979424  1.4300414 ]\n",
      "2= tensor([[-2.8289, -3.4146]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05178748 -1.1461463   0.06839507  1.7348907 ]\n",
      "2= tensor([[-3.0962, -3.6979]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0747104  -1.3419784   0.10309288  2.0480447 ]\n",
      "2= tensor([[-3.3724, -4.0025]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10154997 -1.5379955   0.14405377  2.3707647 ]\n",
      "2= tensor([[-3.6632, -4.3276]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.13230988 -1.734072    0.19146906  2.7040386 ]\n",
      "2= tensor([[-3.9850, -4.6918]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03415581 -0.0362357   0.02048484  0.00267838]\n",
      "2= tensor([[-3.7303, -6.2027]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03488053 -0.23164535  0.02053841  0.3017535 ]\n",
      "2= tensor([[-2.8886, -4.3095]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03951344 -0.42705393  0.02657348  0.60084236]\n",
      "2= tensor([[-2.4915, -3.3340]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04805451 -0.6225373   0.03859033  0.90177566]\n",
      "2= tensor([[-2.4902, -3.1188]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06050526 -0.81816024  0.05662584  1.2063344 ]\n",
      "2= tensor([[-2.6796, -3.2725]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07686847 -1.0139663   0.08075253  1.5162117 ]\n",
      "2= tensor([[-2.9301, -3.5249]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09714779 -1.2099671   0.11107676  1.8329704 ]\n",
      "2= tensor([[-3.2079, -3.8265]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12134714 -1.4061294   0.14773618  2.1579897 ]\n",
      "2= tensor([[-3.4942, -4.1451]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14946972 -1.6023594   0.19089596  2.4924052 ]\n",
      "2= tensor([[-3.8024, -4.4938]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03894126  0.04410342  0.03572914  0.01259127]\n",
      "2= tensor([[-3.8416, -6.4385]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03805919 -0.15151224  0.03598096  0.3163296 ]\n",
      "2= tensor([[-2.9775, -4.4924]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04108944 -0.34712774  0.04230756  0.62013906]\n",
      "2= tensor([[-2.5406, -3.4442]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04803199 -0.5428142   0.05471034  0.92584085]\n",
      "2= tensor([[-2.5289, -3.2139]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05888828 -0.73863065  0.07322715  1.2352028 ]\n",
      "2= tensor([[-2.7064, -3.3428]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07366089 -0.9346134   0.09793121  1.5498986 ]\n",
      "2= tensor([[-2.9560, -3.5931]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09235316 -1.1307645   0.12892918  1.8714613 ]\n",
      "2= tensor([[-3.2370, -3.9061]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11496845 -1.3270383   0.16635841  2.2012289 ]\n",
      "2= tensor([[-3.5270, -4.2305]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04293507 -0.00567857  0.02183285  0.0392197 ]\n",
      "2= tensor([[-3.6969, -6.1208]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04304864 -0.20110668  0.02261724  0.33871037]\n",
      "2= tensor([[-2.8791, -4.2705]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04707077 -0.39654306  0.02939145  0.6384388 ]\n",
      "2= tensor([[-2.4987, -3.3377]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05500163 -0.59206223  0.04216023  0.9402308 ]\n",
      "2= tensor([[-2.5173, -3.1648]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06684288 -0.78772634  0.06096484  1.2458576 ]\n",
      "2= tensor([[-2.7067, -3.3174]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0825974  -0.983575    0.08588199  1.5569973 ]\n",
      "2= tensor([[-2.9609, -3.5758]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1022689  -1.1796142   0.11702194  1.8751906 ]\n",
      "2= tensor([[-3.2395, -3.8827]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12586118 -1.3758029   0.15452576  2.201787  ]\n",
      "2= tensor([[-3.5274, -4.2039]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.15337723 -1.5720377   0.19856149  2.5378819 ]\n",
      "2= tensor([[-3.8347, -4.5531]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0365017   0.04375086 -0.01211815  0.03432952]\n",
      "2= tensor([[-3.9089, -6.5816]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03737672 -0.15119523 -0.01143156  0.32316455]\n",
      "2= tensor([[-3.0461, -4.6545]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03435282 -0.34615254 -0.00496827  0.6122206 ]\n",
      "2= tensor([[-2.5634, -3.5135]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02742977 -0.5412047   0.00727615  0.90333456]\n",
      "2= tensor([[-2.4940, -3.1924]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01660567 -0.73642445  0.02534284  1.1982956 ]\n",
      "2= tensor([[-2.6461, -3.2739]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00187718 -0.93186504  0.04930875  1.4988123 ]\n",
      "2= tensor([[-2.8769, -3.4943]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01676012 -1.1275502   0.079285    1.8064742 ]\n",
      "2= tensor([[-3.1480, -3.7908]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03931112 -1.3234624   0.11541448  2.1227047 ]\n",
      "2= tensor([[-3.4273, -4.1001]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06578037 -1.5195284   0.15786858  2.4487038 ]\n",
      "2= tensor([[-3.7202, -4.4292]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09617094 -1.7156026   0.20684265  2.7853785 ]\n",
      "2= tensor([[-4.0503, -4.8057]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [0.04991713 0.03520013 0.04380789 0.01452034]\n",
      "2= tensor([[-3.9301, -6.6377]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.05062113 -0.1605218   0.04409829  0.32069698]\n",
      "2= tensor([[-3.0337, -4.6351]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0474107  -0.35624313  0.05051223  0.62695426]\n",
      "2= tensor([[-2.5593, -3.5002]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04028584 -0.55203235  0.06305131  0.9351078 ]\n",
      "2= tensor([[-2.5277, -3.2415]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02924519 -0.7479455   0.08175347  1.2469184 ]\n",
      "2= tensor([[-2.7057, -3.3616]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01428628 -0.94401515  0.10669184  1.5640494 ]\n",
      "2= tensor([[-2.9601, -3.6248]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00459403 -1.1402386   0.13797283  1.8880188 ]\n",
      "2= tensor([[-3.2435, -3.9404]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0273988  -1.3365643   0.17573321  2.2201443 ]\n",
      "2= tensor([[-3.5387, -4.2726]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02929661  0.02780259 -0.0284861   0.02584784]\n",
      "2= tensor([[-3.8276, -6.3964]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02874056 -0.16689952 -0.02796914  0.30940872]\n",
      "2= tensor([[-2.9895, -4.5197]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03207855 -0.36161202 -0.02178097  0.5931414 ]\n",
      "2= tensor([[-2.5321, -3.4410]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03931079 -0.5564224  -0.00991814  0.87888455]\n",
      "2= tensor([[-2.4737, -3.1296]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05043923 -0.7514082   0.00765955  1.168433  ]\n",
      "2= tensor([[-2.6253, -3.2200]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0654674  -0.946629    0.03102821  1.4635074 ]\n",
      "2= tensor([[-2.8502, -3.4321]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08439998 -1.142117    0.06029836  1.7657192 ]\n",
      "2= tensor([[-3.1178, -3.7167]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10724232 -1.3378663   0.09561274  2.0765264 ]\n",
      "2= tensor([[-3.3927, -4.0197]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.13399965 -1.5338188   0.13714327  2.39718   ]\n",
      "2= tensor([[-3.6798, -4.3403]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.16467603 -1.7298485   0.18508688  2.7286577 ]\n",
      "2= tensor([[-4.0007, -4.7039]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01869598 -0.01651482 -0.04635168  0.01931641]\n",
      "2= tensor([[-12.5263, -15.2672]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01836569 -0.21094245 -0.04596535  0.2970221 ]\n",
      "2= tensor([[-11.3848, -12.4800]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01414684 -0.40538004 -0.04002491  0.57486135]\n",
      "2= tensor([[-11.4606, -11.3653]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00603924 -0.20972049 -0.02852768  0.26984295]\n",
      "2= tensor([[-11.4153, -12.5533]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00184483 -0.40442398 -0.02313082  0.5533933 ]\n",
      "2= tensor([[-11.4505, -11.3700]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00624365 -0.20898497 -0.01206296  0.2535134 ]\n",
      "2= tensor([[-11.4345, -12.5801]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01042335 -0.40393263 -0.00699269  0.54236716]\n",
      "2= tensor([[-11.4615, -11.3742]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.018502   -0.2087131   0.00385466  0.2474892 ]\n",
      "2= tensor([[-11.4433, -12.5626]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02267626 -0.4038899   0.00880444  0.5413855 ]\n",
      "2= tensor([[-11.4965, -11.3824]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03075406 -0.20889278  0.01963215  0.25148964]\n",
      "2= tensor([[-11.4426, -12.5020]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03493192 -0.40428948  0.02466194  0.5502997 ]\n",
      "2= tensor([[-11.5747, -11.4194]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04301771 -0.20952247  0.03566794  0.26548788]\n",
      "2= tensor([[-11.4438, -12.4148]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04720816 -0.40513486  0.04097769  0.569204  ]\n",
      "2= tensor([[-11.6852, -11.4699]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05531086 -0.60080683  0.05236177  0.8745097 ]\n",
      "2= tensor([[-13.4432, -12.4889]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06732699 -0.4064344   0.06985196  0.5987379 ]\n",
      "2= tensor([[-11.8693, -11.5569]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07545568 -0.21235573  0.08182672  0.3288496 ]\n",
      "2= tensor([[-11.4618, -12.1225]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07970279 -0.40854144  0.08840372  0.6461738 ]\n",
      "2= tensor([[-12.1112, -11.6858]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08787362 -0.2147553   0.10132719  0.3825865 ]\n",
      "2= tensor([[-11.5162, -11.9852]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09216873 -0.411159    0.10897892  0.70542026]\n",
      "2= tensor([[-12.5087, -11.9735]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10039191 -0.21770228  0.12308732  0.44893304]\n",
      "2= tensor([[-11.6153, -11.8737]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10474595 -0.4143307   0.13206598  0.7777406 ]\n",
      "2= tensor([[-13.0335, -12.3970]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11303257 -0.22124808  0.1476208   0.5293534 ]\n",
      "2= tensor([[-11.8666, -11.9263]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11745753 -0.41810468  0.15820786  0.86466974]\n",
      "2= tensor([[-13.6578, -12.9050]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12581962 -0.22544897  0.17550126  0.6256145 ]\n",
      "2= tensor([[-12.2897, -12.1364]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.13032861 -0.03315488  0.18801355  0.392937  ]\n",
      "2= tensor([[-11.9442, -12.7022]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1309917  -0.23037782  0.19587229  0.738509  ]\n",
      "2= tensor([[-12.9057, -12.5788]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01948921  0.01924912  0.01498854 -0.00149604]\n",
      "2= tensor([[-12.7067, -15.5714]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0198742  -0.17608455  0.01495862  0.29587802]\n",
      "2= tensor([[-11.5305, -12.6711]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01635251 -0.3714165   0.02087618  0.59324086]\n",
      "2= tensor([[-11.6260, -11.5200]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00892418 -0.17659292  0.032741    0.30720627]\n",
      "2= tensor([[-11.5267, -12.5836]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00539232 -0.37216574  0.03888512  0.61003244]\n",
      "2= tensor([[-11.7330, -11.5712]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.002051   -0.1776083   0.05108577  0.3298462 ]\n",
      "2= tensor([[-11.5240, -12.4636]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00560316 -0.37341884  0.05768269  0.6381915 ]\n",
      "2= tensor([[-11.8893, -11.6494]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01307154 -0.17914665  0.07044652  0.36421722]\n",
      "2= tensor([[-11.5327, -12.3246]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01665447 -0.37519538  0.07773086  0.6782551 ]\n",
      "2= tensor([[-12.1085, -11.7692]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02415838 -0.18123445  0.09129597  0.41102204]\n",
      "2= tensor([[-11.5747, -12.1924]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02778307 -0.37752405  0.09951641  0.731034  ]\n",
      "2= tensor([[-12.4540, -12.0125]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03533355 -0.18390794  0.11413709  0.47125632]\n",
      "2= tensor([[-11.6726, -12.0814]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03901171 -0.3804414   0.12356222  0.79762185]\n",
      "2= tensor([[-12.9411, -12.4012]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04662054 -0.18721181  0.13951465  0.5462222 ]\n",
      "2= tensor([[-11.8488, -12.0317]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05036477 -0.3839898   0.1504391   0.8794056 ]\n",
      "2= tensor([[-13.5371, -12.8875]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05804457 -0.19119677  0.1680272   0.6375448 ]\n",
      "2= tensor([[-12.2300, -12.2083]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0618685   0.00123305  0.1807781   0.40213305]\n",
      "2= tensor([[-12.0749, -13.0694]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06184385 -0.19593069  0.18882076  0.7459189 ]\n",
      "2= tensor([[-12.7627, -12.5570]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06576246 -0.00384608  0.20373915  0.51809716]\n",
      "2= tensor([[-12.2328, -12.8636]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03365722  0.00090759  0.00081693  0.04546493]\n",
      "2= tensor([[-12.3720, -14.8718]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03363907 -0.19422606  0.00172623  0.3384055 ]\n",
      "2= tensor([[-11.3948, -12.2404]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03752359 -0.38937253  0.00849434  0.63163227]\n",
      "2= tensor([[-11.7671, -11.5017]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04531104 -0.19437012  0.02112699  0.3416365 ]\n",
      "2= tensor([[-11.4138, -12.2063]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04919844 -0.38978618  0.02795972  0.6409061 ]\n",
      "2= tensor([[-11.8562, -11.5476]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05699417 -0.19506495  0.04077784  0.35715744]\n",
      "2= tensor([[-11.4348, -12.1389]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06089547 -0.00054574  0.04792099  0.07760657]\n",
      "2= tensor([[-12.2504, -14.4903]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06090638 -0.19632074  0.04947312  0.38501534]\n",
      "2= tensor([[-11.4504, -12.0594]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06483279 -0.39210886  0.05717343  0.69287735]\n",
      "2= tensor([[-12.1619, -11.7272]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07267497 -0.19782473  0.07103097  0.41872716]\n",
      "2= tensor([[-11.5056, -11.9798]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07663146 -0.39387757  0.07940552  0.73293036]\n",
      "2= tensor([[-12.4776, -11.9648]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08450902 -0.19993733  0.09406412  0.4662574 ]\n",
      "2= tensor([[-11.5918, -11.9039]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08850776 -0.3962537   0.10338927  0.7870442 ]\n",
      "2= tensor([[-12.9039, -12.3108]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09643283 -0.20269245  0.11913016  0.5285951 ]\n",
      "2= tensor([[-11.7795, -11.9160]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10048669 -0.39927122  0.12970206  0.8563148 ]\n",
      "2= tensor([[-13.4286, -12.7395]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10847211 -0.20613247  0.14682835  0.6070657 ]\n",
      "2= tensor([[-12.0992, -12.0527]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11259476 -0.01333547  0.15896967  0.36399448]\n",
      "2= tensor([[-11.9259, -12.8938]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11286147 -0.21031742  0.16624956  0.70228225]\n",
      "2= tensor([[-12.5517, -12.3279]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11706782 -0.01784209  0.1802952   0.46620244]\n",
      "2= tensor([[-12.0312, -12.6667]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11742466 -0.21499218  0.18961924  0.8098542 ]\n",
      "2= tensor([[-13.2076, -12.8414]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1217245  -0.02290366  0.20581633  0.5823005 ]\n",
      "2= tensor([[-12.2767, -12.5747]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00173612  0.00425611 -0.03890987 -0.03963156]\n",
      "2= tensor([[-12.7978, -15.7986]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.001651   -0.1902869  -0.0397025   0.24052545]\n",
      "2= tensor([[-11.4530, -12.7358]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00545673 -0.38481987 -0.03489199  0.5204255 ]\n",
      "2= tensor([[-11.3595, -11.3885]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01315313 -0.57943374 -0.02448348  0.8019124 ]\n",
      "2= tensor([[-12.5695, -11.7647]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02474181 -0.3839847  -0.00844523  0.50162935]\n",
      "2= tensor([[-11.3819, -11.4022]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0324215  -0.5789866   0.00158736  0.7916389 ]\n",
      "2= tensor([[-12.6555, -11.8359]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04400123 -0.3838865   0.01742013  0.49945575]\n",
      "2= tensor([[-11.4338, -11.4102]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05167896 -0.18901439  0.02740925  0.21231325]\n",
      "2= tensor([[-11.4950, -12.6800]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05545925 -0.38451728  0.03165551  0.51351476]\n",
      "2= tensor([[-11.5017, -11.4246]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06314959 -0.18985514  0.04192581  0.23097299]\n",
      "2= tensor([[-11.4867, -12.5687]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0669467  -0.38555032  0.04654527  0.5365804 ]\n",
      "2= tensor([[-11.6033, -11.4575]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07465771 -0.19111268  0.05727688  0.25891915]\n",
      "2= tensor([[-11.4805, -12.4323]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07847996 -0.38700354  0.06245526  0.56910384]\n",
      "2= tensor([[-11.7534, -11.5231]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08622003 -0.19281061  0.07383734  0.29673222]\n",
      "2= tensor([[-11.4729, -12.2627]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09007624 -0.38890323  0.07977198  0.6117582 ]\n",
      "2= tensor([[-11.9478, -11.6125]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09785431 -0.19498149  0.09200715  0.34522867]\n",
      "2= tensor([[-11.4912, -12.0978]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10175394 -0.39128357  0.09891172  0.66544837]\n",
      "2= tensor([[-12.2537, -11.8004]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10957961 -0.19766642  0.11222068  0.40547478]\n",
      "2= tensor([[-11.5649, -11.9656]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11353294 -0.39418602  0.12033018  0.73132366]\n",
      "2= tensor([[-12.7124, -12.1538]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12141666 -0.20091431  0.13495666  0.47880417]\n",
      "2= tensor([[-11.7216, -11.9130]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12543494 -0.39765763  0.14453274  0.8107926 ]\n",
      "2= tensor([[-13.2847, -12.6193]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1333881  -0.20478013  0.16074859  0.56683785]\n",
      "2= tensor([[-12.0439, -12.0324]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1374837  -0.01223479  0.17208534  0.32880014]\n",
      "2= tensor([[-11.9187, -12.9254]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.1377284  -0.20933533  0.17866135  0.67042786]\n",
      "2= tensor([[-12.5004, -12.2910]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1419151  -0.01708779  0.1920699   0.43889418]\n",
      "2= tensor([[-12.0138, -12.6615]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14225686 -0.21433526  0.20084779  0.78544664]\n",
      "2= tensor([[-13.1695, -12.8034]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04362293  0.00225865  0.0119299  -0.03993155]\n",
      "2= tensor([[-12.6657, -15.4805]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04357776 -0.19303232  0.01113127  0.25649136]\n",
      "2= tensor([[-11.4434, -12.5122]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0474384  -0.38831142  0.0162611   0.5526644 ]\n",
      "2= tensor([[-11.5582, -11.4201]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05520463 -0.19342156  0.02731439  0.26514882]\n",
      "2= tensor([[-11.4499, -12.4492]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05907306 -0.38892248  0.03261736  0.56632024]\n",
      "2= tensor([[-11.6520, -11.4644]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06685151 -0.19427294  0.04394377  0.28408903]\n",
      "2= tensor([[-11.4508, -12.3470]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07073697 -0.3899932   0.04962555  0.59030133]\n",
      "2= tensor([[-11.7792, -11.5223]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07853683 -0.19559991  0.06143158  0.3136543 ]\n",
      "2= tensor([[-11.4538, -12.2156]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08244883 -0.39154074  0.06770466  0.6250606 ]\n",
      "2= tensor([[-11.9470, -11.5994]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09027965 -0.19742604  0.08020587  0.35444564]\n",
      "2= tensor([[-11.4753, -12.0766]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09422817 -0.39359137  0.08729479  0.671303  ]\n",
      "2= tensor([[-12.2265, -11.7744]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10209999 -0.19978446  0.10072085  0.40733165]\n",
      "2= tensor([[-11.5433, -11.9580]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10609569 -0.3961796   0.10886748  0.7299932 ]\n",
      "2= tensor([[-12.6440, -12.0934]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11401927 -0.20271727  0.12346734  0.4734616 ]\n",
      "2= tensor([[-11.6714, -11.8865]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11807362 -0.39934683  0.13293657  0.8023679 ]\n",
      "2= tensor([[-13.1762, -12.5268]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12606056 -0.20627394  0.14898393  0.5542822 ]\n",
      "2= tensor([[-11.9572, -11.9826]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.13018604 -0.4031392   0.16006957  0.8899483 ]\n",
      "2= tensor([[-13.8085, -13.0429]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.13824882 -0.21050878  0.17786855  0.65155625]\n",
      "2= tensor([[-12.4145, -12.2297]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.14245899 -0.01825137  0.19089967  0.41973802]\n",
      "2= tensor([[-11.9914, -12.6882]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.14282402 -0.21549286  0.19929443  0.76600987]\n",
      "2= tensor([[-13.0670, -12.7206]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04868633 -0.04818612  0.04522527 -0.03413713]\n",
      "2= tensor([[-12.6723, -15.4936]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04772261 -0.24392645  0.04454253  0.27246487]\n",
      "2= tensor([[-11.4883, -12.5392]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04284408 -0.04946745  0.04999183 -0.00584316]\n",
      "2= tensor([[-12.5449, -15.2210]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04185473 -0.24526939  0.04987496  0.30218428]\n",
      "2= tensor([[-11.4592, -12.3902]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03694934 -0.05089244  0.05591865  0.02563859]\n",
      "2= tensor([[-12.4276, -14.9448]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03593149 -0.24676986  0.05643142  0.33542702]\n",
      "2= tensor([[-11.4438, -12.2491]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.0309961  -0.44264764  0.06313996  0.64535797]\n",
      "2= tensor([[-11.9368, -11.5906]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02214314 -0.24845973  0.07604712  0.37320736]\n",
      "2= tensor([[-11.4671, -12.1166]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01717395 -0.44457495  0.08351126  0.6888663 ]\n",
      "2= tensor([[-12.2020, -11.7568]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.00828245 -0.25070518  0.09728859  0.42359892]\n",
      "2= tensor([[-11.5303, -11.9952]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00326835 -0.44706106  0.10576057  0.7452977 ]\n",
      "2= tensor([[-12.6008, -12.0528]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00567287 -0.25354517  0.12066653  0.4876814 ]\n",
      "2= tensor([[-11.6361, -11.8860]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01074378 -0.45014453  0.13042015  0.81582606]\n",
      "2= tensor([[-13.1197, -12.4674]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01974667 -0.2570264   0.14673667  0.56684387]\n",
      "2= tensor([[-11.8845, -11.9243]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02488719 -0.45386896  0.15807354  0.9019206 ]\n",
      "2= tensor([[-13.7482, -12.9788]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03396457 -0.26120085  0.17611197  0.6628019 ]\n",
      "2= tensor([[-12.3474, -12.1758]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03918859 -0.0689095   0.189368    0.43033606]\n",
      "2= tensor([[-11.9938, -12.7494]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04056678 -0.26613745  0.19797473  0.77623135]\n",
      "2= tensor([[-13.0000, -12.6515]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.04212084  0.01981043 -0.02956016 -0.04776896]\n",
      "2= tensor([[-13.0361, -16.2337]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.04251705 -0.17487545 -0.03051554  0.23544286]\n",
      "2= tensor([[-11.5727, -13.0225]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03901954 -0.36954844 -0.02580668  0.5183462 ]\n",
      "2= tensor([[-11.3764, -11.5071]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.03162857 -0.56429774 -0.01543976  0.8027865 ]\n",
      "2= tensor([[-12.5160, -11.7778]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02034262 -0.36896747  0.00061597  0.505287  ]\n",
      "2= tensor([[-11.4020, -11.5074]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01296327 -0.5640981   0.01072171  0.798164  ]\n",
      "2= tensor([[-12.6203, -11.8584]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.0016813  -0.3691249   0.02668499  0.5088731 ]\n",
      "2= tensor([[-11.4562, -11.4999]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00570119 -0.56461245  0.03686246  0.8098445 ]\n",
      "2= tensor([[-12.8247, -12.0198]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01699344 -0.37001443  0.05305934  0.52898085]\n",
      "2= tensor([[-11.5518, -11.5047]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02439373 -0.17567751  0.06363896  0.25347784]\n",
      "2= tensor([[-11.5702, -12.6909]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.02790728 -0.3716477   0.06870852  0.5655353 ]\n",
      "2= tensor([[-11.7051, -11.5663]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03534023 -0.17755355  0.08001922  0.29526544]\n",
      "2= tensor([[-11.5516, -12.4944]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0388913  -0.3737197   0.08592454  0.61207366]\n",
      "2= tensor([[-11.9105, -11.6602]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0463657  -0.17989704  0.098166    0.34764305]\n",
      "2= tensor([[-11.5534, -12.2950]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04996364 -0.37626824  0.10511886  0.6695962 ]\n",
      "2= tensor([[-12.2100, -11.8306]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.057489   -0.18275276  0.11851079  0.4117733 ]\n",
      "2= tensor([[-11.6145, -12.1357]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06114406 -0.37933782  0.12674625  0.7393432 ]\n",
      "2= tensor([[-12.6709, -12.1732]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06873082 -0.18617262  0.14153312  0.48908338]\n",
      "2= tensor([[-11.7487, -12.0224]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.07245427 -0.3829779   0.1513148   0.8228114 ]\n",
      "2= tensor([[-13.2661, -12.6576]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08011383 -0.19021398  0.16777101  0.5812864 ]\n",
      "2= tensor([[-12.0612, -12.1134]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08391811 -0.38724008  0.17939675  0.9217696 ]\n",
      "2= tensor([[-13.9636, -13.2257]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09166291 -0.19493619  0.19783214  0.6904033 ]\n",
      "2= tensor([[-12.5853, -12.4156]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03422749 -0.00511248  0.03275306 -0.04836183]\n",
      "2= tensor([[-12.6865, -15.5063]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03432973  0.18952487  0.03178583 -0.33053362]\n",
      "2= tensor([[-15.3914, -20.2771]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03053924 -0.00603478  0.02517515 -0.02799883]\n",
      "2= tensor([[-12.6116, -15.3626]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03065993 -0.20150854  0.02461518  0.27251962]\n",
      "2= tensor([[-11.4502, -12.4608]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0346901  -0.39697292  0.03006557  0.5728635 ]\n",
      "2= tensor([[-11.6508, -11.4662]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04262956 -0.20228514  0.04152284  0.28980175]\n",
      "2= tensor([[-11.4522, -12.3642]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04667526 -0.39797384  0.04731888  0.595286  ]\n",
      "2= tensor([[-11.7742, -11.5227]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05463474 -0.20354497  0.05922459  0.31787568]\n",
      "2= tensor([[-11.4541, -12.2344]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05870564 -0.39945826  0.06558211  0.62863225]\n",
      "2= tensor([[-11.9334, -11.5937]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0666948  -0.20530988  0.07815475  0.35730305]\n",
      "2= tensor([[-11.4744, -12.0969]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.070801   -0.40145093  0.08530081  0.67357063]\n",
      "2= tensor([[-12.2039, -11.7604]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07883003 -0.20761164  0.09877223  0.40891692]\n",
      "2= tensor([[-11.5398, -11.9783]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08298226 -0.4039851   0.10695057  0.73103327]\n",
      "2= tensor([[-12.6110, -12.0675]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.09106196 -0.21049099  0.12157123  0.47383404]\n",
      "2= tensor([[-11.6542, -11.8877]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09527177 -0.40710118  0.1310479   0.8022266 ]\n",
      "2= tensor([[-13.1373, -12.4960]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.1034138  -0.21399644  0.14709245  0.553471  ]\n",
      "2= tensor([[-11.9269, -11.9684]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10769373 -0.41084442  0.15816186  0.8886439 ]\n",
      "2= tensor([[-13.7622, -13.0050]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11591062 -0.21818146  0.17593475  0.64956254]\n",
      "2= tensor([[-12.3698, -12.2019]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12027425 -0.02588992  0.188926    0.4170361 ]\n",
      "2= tensor([[-11.9892, -12.7227]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.12079205 -0.22311647  0.19726671  0.7628263 ]\n",
      "2= tensor([[-13.0089, -12.6762]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01220919 -0.03681831  0.01785383  0.02989342]\n",
      "2= tensor([[-12.3983, -14.9324]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01147283 -0.23219168  0.0184517   0.32815552]\n",
      "2= tensor([[-11.3968, -12.2488]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00682899 -0.4275714   0.02501481  0.62659967]\n",
      "2= tensor([[-11.7877, -11.4994]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00172244 -0.23280738  0.03754681  0.34189865]\n",
      "2= tensor([[-11.4105, -12.1741]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00637858 -0.42844284  0.04438478  0.6461812 ]\n",
      "2= tensor([[-11.9090, -11.5565]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01494744 -0.23396654  0.0573084   0.36779886]\n",
      "2= tensor([[-11.4327, -12.0752]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01962677 -0.429854    0.06466438  0.67798716]\n",
      "2= tensor([[-12.1041, -11.6688]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02822385 -0.2356872   0.07822412  0.40634373]\n",
      "2= tensor([[-11.4855, -11.9777]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03293759 -0.4318262   0.086351    0.722627  ]\n",
      "2= tensor([[-12.4398, -11.9187]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.04157412 -0.23799805  0.10080354  0.45832372]\n",
      "2= tensor([[-11.5670, -11.8780]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.04633408 -0.43438974  0.10997001  0.7810019 ]\n",
      "2= tensor([[-12.8780, -12.2631]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05502187 -0.24093743  0.12559006  0.5248423 ]\n",
      "2= tensor([[-11.7420, -11.8590]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05984062 -0.43758222  0.1360869   0.85431284]\n",
      "2= tensor([[-13.4273, -12.7105]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06859227 -0.24455132  0.15317315  0.60732967]\n",
      "2= tensor([[-12.0872, -12.0154]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.0734833  -0.0518652   0.16531974  0.36654148]\n",
      "2= tensor([[-11.9017, -12.8337]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0745206  -0.24890308  0.17265058  0.70645154]\n",
      "2= tensor([[-12.5656, -12.3053]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07949866 -0.05654004  0.1867796   0.47270426]\n",
      "2= tensor([[-12.0207, -12.6090]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08062946 -0.2537408   0.19623369  0.8179551 ]\n",
      "2= tensor([[-13.2706, -12.8619]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.02383349 -0.01939044 -0.04344007  0.01586801]\n",
      "2= tensor([[-12.5379, -15.2927]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.02344568 -0.21386336 -0.04312271  0.29453483]\n",
      "2= tensor([[-11.3913, -12.4952]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.01916841 -0.40834484 -0.03723201  0.5733117 ]\n",
      "2= tensor([[-11.4608, -11.3668]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [ 0.01100151 -0.21272118 -0.02576578  0.2691359 ]\n",
      "2= tensor([[-11.4199, -12.5604]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [ 0.00674709 -0.40746614 -0.02038306  0.5535821 ]\n",
      "2= tensor([[-11.4543, -11.3714]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.00140223 -0.21206398 -0.00931142  0.25454754]\n",
      "2= tensor([[-11.4373, -12.5793]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.00564351 -0.40705174 -0.00422047  0.544279  ]\n",
      "2= tensor([[-11.4691, -11.3755]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.01378455 -0.21187074  0.00666511  0.25026926]\n",
      "2= tensor([[-11.4444, -12.5538]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.01802196 -0.40708724  0.0116705   0.54504704]\n",
      "2= tensor([[-11.5128, -11.3894]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.02616371 -0.2121312   0.02257144  0.25606394]\n",
      "2= tensor([[-11.4419, -12.4850]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.03040633 -0.40756804  0.02769272  0.55577993]\n",
      "2= tensor([[-11.5978, -11.4299]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.03855769 -0.21284561  0.03880832  0.27194893]\n",
      "2= tensor([[-11.4429, -12.3913]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.0428146  -0.4084992   0.0442473   0.57661515]\n",
      "2= tensor([[-11.7149, -11.4830]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.05098459 -0.2140245   0.0557796   0.29819304]\n",
      "2= tensor([[-11.4391, -12.2589]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.05526508 -0.4098954   0.06174346  0.6079331 ]\n",
      "2= tensor([[-11.8663, -11.5501]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.06346299 -0.21568853  0.07390212  0.33531895]\n",
      "2= tensor([[-11.4521, -12.1179]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.06777676 -0.41178018  0.0806085   0.650361  ]\n",
      "2= tensor([[-12.0859, -11.6651]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.07601237 -0.21786803  0.09361572  0.38411054]\n",
      "2= tensor([[-11.5031, -11.9905]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.08036973 -0.41418576  0.10129793  0.7047805 ]\n",
      "2= tensor([[-12.4597, -11.9360]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.08865344 -0.22060248  0.11539354  0.44562486]\n",
      "2= tensor([[-11.5950, -11.8817]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.09306549 -0.41715175  0.12430604  0.77233845]\n",
      "2= tensor([[-12.9526, -12.3297]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.10140852 -0.22393939  0.1397528   0.5212081 ]\n",
      "2= tensor([[-11.8147, -11.9040]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.10588731 -0.4207233   0.15017697  0.8544599 ]\n",
      "2= tensor([[-13.5487, -12.8147]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11430178 -0.22793205  0.16726618  0.6125142 ]\n",
      "2= tensor([[-12.2002, -12.0843]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.11886042 -0.03549381  0.17951645  0.3768327 ]\n",
      "2= tensor([[-11.9253, -12.7580]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n",
      "1= [-0.11957029 -0.23265067  0.1870531   0.7203104 ]\n",
      "2= tensor([[-12.7580, -12.4620]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(1)\n",
      "4= 1\n",
      "1= [-0.12422331 -0.04054118  0.20145932  0.49184623]\n",
      "2= tensor([[-12.0715, -12.5426]], grad_fn=<AddmmBackward0>)\n",
      "3= tensor(0)\n",
      "4= 0\n"
     ]
    }
   ],
   "execution_count": 9
  },
  {
   "cell_type": "code",
   "id": "a101d0e6",
   "metadata": {},
   "source": [
    "# Call play(True) once and show the last element of its return value as the cell output.\n",
    "# NOTE(review): play is defined in an earlier cell; presumably True enables rendering and\n",
    "# the last element is the total reward of the episode -- confirm against that definition.\n",
    "play(True)[-1]"
   ],
   "execution_count": 10,
   "outputs": [
    {
     "data": {
      "text/plain": [
       "-973.0"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ]
  },
  {
   "cell_type": "code",
   "id": "908347ed-ac03-4bfa-8d80-0a6889b6061e",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-12-30T06:23:24.439314Z",
     "start_time": "2024-12-30T06:23:24.437243Z"
    }
   },
   "source": [],
   "outputs": [],
   "execution_count": null
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.20"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
